- Notifications
You must be signed in to change notification settings - Fork 38
/
Copy pathrepo_request.py
106 lines (81 loc) · 2.76 KB
/
repo_request.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
importhashlib
importre
fromsqlalchemyimportand_
fromappimportdb
fromendpointimportEndpoint
fromrepositoryimportRepository
class RepoRequest(db.Model):
    """A submitted request describing a repository and its PMH endpoint.

    Every column is stored as text except ``updated`` (a DateTime). The
    instance can look up ``Endpoint`` and ``Repository`` rows that resemble
    the requested one, and can serialise itself to a plain dict.
    """

    id = db.Column(db.Text, primary_key=True)
    updated = db.Column(db.DateTime)
    email = db.Column(db.Text)
    pmh_url = db.Column(db.Text)
    repo_name = db.Column(db.Text)
    institution_name = db.Column(db.Text)
    examples = db.Column(db.Text)
    repo_home_page = db.Column(db.Text)
    comments = db.Column(db.Text)
    pmh_set = db.Column(db.Text)
    metadata_prefix = db.Column(db.Text)
    duplicate_request = db.Column(db.Text)

    def __init__(self, **kwargs):
        """Pass all keyword arguments through to the parent constructor."""
        # Name the class explicitly: super(self.__class__, self) resolves to
        # the *subclass* when called on a subclass instance and then recurses
        # forever. This spelling works on both Python 2 and Python 3.
        super(RepoRequest, self).__init__(**kwargs)

    # trying to make sure the rows are unique
    def set_id_seed(self, id_seed):
        """Set ``id`` to the first six hex digits of the MD5 of ``id_seed``.

        ``id_seed`` must be a text string; it is UTF-8 encoded before hashing.
        """
        # NOTE(review): six hex digits is only 24 bits, so distinct seeds can
        # collide. Left unchanged because existing ids depend on this length.
        self.id = hashlib.md5(id_seed.encode('utf-8')).hexdigest()[0:6]

    @classmethod
    def list_fieldnames(cls):
        """Return the column names as a new list, in spreadsheet order."""
        # these are the same order as the columns in the input google spreadsheet
        return [
            "id",
            "updated",
            "email",
            "pmh_url",
            "repo_name",
            "institution_name",
            "examples",
            "repo_home_page",
            "comments",
            "pmh_set",
            "metadata_prefix",
            "duplicate_request",
        ]

    @property
    def is_duplicate(self):
        """True when ``duplicate_request`` is exactly the string "dup"."""
        return self.duplicate_request == "dup"

    @property
    def endpoints(self):
        """Return an empty list; ``matching_endpoints`` starts from it."""
        return []

    @property
    def repositories(self):
        """Return an empty list; ``matching_repositories`` starts from it."""
        return []

    def matching_endpoints(self):
        """Return ``endpoints`` plus Endpoint rows whose URL resembles ours.

        The text after ``//`` in ``pmh_url``, up to and including the first
        path segment, is searched for case-insensitively as a substring of
        ``Endpoint.pmh_url``. If ``pmh_url`` is empty or has no such fragment,
        only the contents of ``endpoints`` are returned.
        """
        # Copy so the list handed back by the property is never extended in
        # place, whatever that property returns in the future.
        response = list(self.endpoints)

        if not self.pmh_url:
            return response

        url_fragments = re.findall(r'//([^/]+/[^/]+)', self.pmh_url)
        if not url_fragments:
            return response

        # NOTE(review): any "%" or "_" inside the fragment is interpreted as a
        # LIKE wildcard by the database; confirm that loose matching is wanted.
        pattern = "%{}%".format(url_fragments[0])
        hits = Endpoint.query.filter(Endpoint.pmh_url.ilike(pattern)).all()
        response.extend(hits)
        return response

    def matching_repositories(self):
        """Return ``repositories`` plus Repository rows resembling this one.

        A row matches when its ``institution_name`` contains our
        ``institution_name`` and its ``repository_name`` contains our
        ``repo_name``, both case-insensitively. If either of our two values is
        empty, only the contents of ``repositories`` are returned.
        """
        # Copy for the same reason as in matching_endpoints.
        response = list(self.repositories)

        if not self.institution_name or not self.repo_name:
            return response

        # NOTE(review): "%" and "_" in either value act as LIKE wildcards.
        institution_pattern = "%{}%".format(self.institution_name)
        repo_pattern = "%{}%".format(self.repo_name)
        hits = Repository.query.filter(and_(
            Repository.institution_name.ilike(institution_pattern),
            Repository.repository_name.ilike(repo_pattern),
        )).all()
        response.extend(hits)
        return response

    def to_dict(self):
        """Return a dict mapping each name in ``list_fieldnames`` to its value."""
        return {
            fieldname: getattr(self, fieldname)
            for fieldname in RepoRequest.list_fieldnames()
        }

    def __repr__(self):
        return "<RepoRequest ( {} ) {}>".format(self.id, self.pmh_url)