preprints.py 4.11 KB
Newer Older
1 2 3 4 5 6 7
# -*- coding: utf-8 -*-
""" harvest_tools.preprints

"""
import traceback


8
from automaton import Automaton
LE GAC Renaud's avatar
LE GAC Renaud committed
9
from base import family_name_fr, format_author_fr, MSG_CRASH, MSG_LOAD
10
from invenio_tools import CheckException, RecordConf, RecordThesis
11 12 13
from plugin_dbui import UNDEF_ID


14 15 16 17
MSG_PREPRINT_IS_PAPER = "Reject preprint is a published paper"
MSG_PREPRINT_IS_CONFERENCE = "Reject preprint is a conference"
MSG_PREPRINT_IS_THESIS = "Reject preprint is a thesis"
MSG_PREPRINT_NO_NUMBER = "Reject no preprint number"
18 19


20
class Preprints(Automaton):
21
    """Automaton for preprints.
22 23

    """
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
    def check_record(self, record):
        """Check the content of the preprint in order to fix non conformities.

        @type record: L{Record}
        @param record:

        @rtype: bool
        @return: C{False} when a non conformity is found and can not be
        corrected.

        """
        if not Automaton.check_record(self, record):
            return False

        if self.dbg:
LE GAC Renaud's avatar
LE GAC Renaud committed
39
            print "check preprint record"
40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60

        if record.is_published():
            self.logs[-1].reject(MSG_PREPRINT_IS_PAPER, record.year())
            return False

        if isinstance(record, RecordConf):
            self.logs[-1].reject(MSG_PREPRINT_IS_CONFERENCE, record.year())
            return False

        if isinstance(record, RecordThesis):
            self.logs[-1].reject(MSG_PREPRINT_IS_THESIS, record.year())
            return False

        if not record.preprint_number():
            self.logs[-1].reject(MSG_PREPRINT_NO_NUMBER, record.year())
            return False

        try:
            self.check.submitted(record)
            self.check.year(record)

61 62 63
            self.check.format_authors(record, format_author_fr)
            self.check.get_my_authors(record, family_name_fr)

64 65 66 67 68 69 70 71 72 73
        except CheckException as e:
            self.logs[-1].reject(e, record.year())
            return False

        except Exception as e:
            self.logs[-1].reject(MSG_CRASH % e, record.year(), translate=False)
            print traceback.format_exc()
            return False

        return True
74

75 76
    def insert_record(self, record):
        """Insert a preprint in the database.
77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93

        @type record: L{Record}
        @param record:

        @rtype: int
        @return: one when the record is inserted / updated in the database
        zero otherwise.

        """
        # alias
        first_author = record.first_author()
        oai_url = record.oai_url()
        preprint = record.preprint_number()
        title = record.title()
        submitted = record.submitted()[0]
        year = record.year()

94
        # get the collaboration identifier
95
        id_collaboration = self.get_create_collaboration(record.collaboration())
96

97
        # get existing preprint or article
LE GAC Renaud's avatar
LE GAC Renaud committed
98 99 100 101 102 103 104 105 106 107
        fields = dict(first_author=first_author,
                      id_projects=self.id_project,
                      id_teams=self.id_team,
                      oai_url=oai_url,
                      preprint=preprint,
                      submitted=submitted,
                      title=title,
                      year=year)

        rec_id, status = self.get_record_by_fields(**fields)
108 109 110 111
        if rec_id:
            return status

        # eventually insert a new preprint
112
        ret = 1
113
        if not self.dry_run:
LE GAC Renaud's avatar
LE GAC Renaud committed
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
            fields = dict(authors=record.authors(),
                          authors_institute=record.my_authors,
                          first_author=first_author,
                          id_categories=self.id_category,
                          id_collaborations=id_collaboration,
                          id_projects=self.id_project,
                          id_status=UNDEF_ID,
                          id_teams=self.id_team,
                          origin=oai_url,
                          preprint=preprint,
                          publication_url=record.paper_url(),
                          submitted=submitted,
                          title=title,
                          year=year)

            ret = self._insert_in_db(log_year=year, **fields)
130 131 132 133 134 135

        if ret == 1:
            self.logs[-1].load(MSG_LOAD, year)
            return 1

        return 0