preprints.py 4.13 KB
Newer Older
1 2 3 4 5 6 7
# -*- coding: utf-8 -*-
""" harvest_tools.preprints

"""
import traceback


8
from automaton import Automaton
9
from base import family_name_fr, MSG_CRASH, MSG_LOAD
10
from invenio_tools import CheckException, RecordConf, RecordThesis
11 12 13
from plugin_dbui import UNDEF_ID


14 15 16 17
MSG_PREPRINT_IS_PAPER = "Reject preprint is a published paper"
MSG_PREPRINT_IS_CONFERENCE = "Reject preprint is a conference"
MSG_PREPRINT_IS_THESIS = "Reject preprint is a thesis"
MSG_PREPRINT_NO_NUMBER = "Reject no preprint number"
18 19


20
class Preprints(Automaton):
21
    """Automaton for preprints.
22 23

    """
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
    def check_record(self, record):
        """Check the content of the preprint in order to fix non conformities.

        @type record: L{Record}
        @param record:

        @rtype: bool
        @return: C{False} when a non conformity is found and can not be
        corrected.

        """
        if not Automaton.check_record(self, record):
            return False

        if self.dbg:
            print "select preprint record"

        if record.is_published():
            self.logs[-1].reject(MSG_PREPRINT_IS_PAPER, record.year())
            return False

        if isinstance(record, RecordConf):
            self.logs[-1].reject(MSG_PREPRINT_IS_CONFERENCE, record.year())
            return False

        if isinstance(record, RecordThesis):
            self.logs[-1].reject(MSG_PREPRINT_IS_THESIS, record.year())
            return False

        if not record.preprint_number():
            self.logs[-1].reject(MSG_PREPRINT_NO_NUMBER, record.year())
            return False

        try:
            self.check.submitted(record)
            self.check.year(record)

61 62 63 64
            self.check.format_authors(record, format_author_fr)
            self.check.get_my_authors(record, family_name_fr)
            self.check.fix_oai(record)

65 66 67 68 69 70 71 72 73 74
        except CheckException as e:
            self.logs[-1].reject(e, record.year())
            return False

        except Exception as e:
            self.logs[-1].reject(MSG_CRASH % e, record.year(), translate=False)
            print traceback.format_exc()
            return False

        return True
75

76 77
    def insert_record(self, record):
        """Insert a preprint in the database.
78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94

        @type record: L{Record}
        @param record:

        @rtype: int
        @return: one when the record is inserted / updated in the database
        zero otherwise.

        """
        # alias
        first_author = record.first_author()
        oai_url = record.oai_url()
        preprint = record.preprint_number()
        title = record.title()
        submitted = record.submitted()[0]
        year = record.year()

95
        # get the collaboration identifier
96
        id_collaboration = self.get_create_collaboration(record.collaboration())
97

98
        # get existing preprint or article
LE GAC Renaud's avatar
LE GAC Renaud committed
99 100 101 102 103 104 105 106 107 108
        fields = dict(first_author=first_author,
                      id_projects=self.id_project,
                      id_teams=self.id_team,
                      oai_url=oai_url,
                      preprint=preprint,
                      submitted=submitted,
                      title=title,
                      year=year)

        rec_id, status = self.get_record_by_fields(**fields)
109 110 111 112
        if rec_id:
            return status

        # eventually insert a new preprint
113
        ret = 1
114
        if not self.dry_run:
LE GAC Renaud's avatar
LE GAC Renaud committed
115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130
            fields = dict(authors=record.authors(),
                          authors_institute=record.my_authors,
                          first_author=first_author,
                          id_categories=self.id_category,
                          id_collaborations=id_collaboration,
                          id_projects=self.id_project,
                          id_status=UNDEF_ID,
                          id_teams=self.id_team,
                          origin=oai_url,
                          preprint=preprint,
                          publication_url=record.paper_url(),
                          submitted=submitted,
                          title=title,
                          year=year)

            ret = self._insert_in_db(log_year=year, **fields)
131 132 133 134 135 136

        if ret == 1:
            self.logs[-1].load(MSG_LOAD, year)
            return 1

        return 0