@@ -9,29 +9,28 @@ class Cord19Dataset(BaseDataSet):
9
9
topic = "Covid-19"
10
10
license = "Covid dataset license"
11
11
link = "https://pages.semanticscholar.org/coronavirus-research"
12
- last_update = "2020-03-13 "
12
+ last_update = "2020-03-20 "
13
13
description = "A free dataset on publications on the corona virus."
14
14
img_url = ("https://pages.semanticscholar.org/hs-fs/hubfs/"
15
15
"covid-image.png?width=300&name=covid-image.png" )
16
16
link = "https://pages.semanticscholar.org/coronavirus-research"
17
17
year = 2020
18
18
19
19
20
- class Cord19DatasetV3 (Cord19Dataset ):
21
- dataset_id = "cord19-v3 "
22
- title = "CORD-19 v3 "
23
- sha512 = ("6741211cc47c04897b253a3eaf2d18e6d57391530f8cebe7d8c84310f82 "
24
- "c90b2c55071157b418fb7b627302adbfae8838fb8c071516288b320b131 "
25
- "03ac1ec7fc " )
20
+ class Cord19DatasetV4 (Cord19Dataset ):
21
+ dataset_id = "cord19-v4 "
22
+ title = "CORD-19 v4 "
23
+ sha512 = ("517e2399767aa1d387baaa07c42ef6ac9a5aec1e3a41f832974ee712413 "
24
+ "272429f2a5ea658b32bb7330becac70df1ee5262ae1ddebb258a02aaaa2 "
25
+ "d4b47335cc " )
26
26
27
- date = "2020-03-13 "
27
+ date = "2020-03-20 "
28
28
statistics = {
29
- "n_papers" : 29500 ,
30
- "n_missing_titles" : 9 ,
31
- "n_missing_abstracts" : 2591 ,
29
+ "n_papers" : 44220 ,
30
+ "n_missing_titles" : 224 ,
31
+ "n_missing_abstracts" : 8414 ,
32
32
}
33
- url = ("https://ai2-semanticscholar-cord-19.s3-us-west-2.amazonaws.com/"
34
- "2020-03-13/all_sources_metadata_2020-03-13.csv" )
33
+ url = ("https://ai2-semanticscholar-cord-19.s3-us-west-2.amazonaws.com/2020-03-20/metadata.csv" )
35
34
36
35
37
36
class Cord19DatasetV4_Dec2019 (Cord19Dataset ):
@@ -58,6 +57,6 @@ class Covid19DataGroup(BaseDataGroup):
58
57
59
58
def __init__ (self ):
60
59
super (Covid19DataGroup , self ).__init__ (
61
- Cord19DatasetV3 (),
60
+ Cord19DatasetV4 (),
62
61
Cord19DatasetV4_Dec2019 (),
63
62
)
0 commit comments