ConferenceCorpus: Difference between revisions
Jump to navigation
Jump to search
(→Issues) |
(→Event) |
||
| Line 81: | Line 81: | ||
title | title | ||
ConfIDent Event | ConfIDent Event | ||
2022-04-06 | |||
[[https://projects.tib.eu/en/confident/ © 2019- | [[https://projects.tib.eu/en/confident/ © 2019-2022 ConfIDent project]] | ||
see also [[http://ptp.bitplan.com/settings Proceedings Title Parser]] | see also [[http://ptp.bitplan.com/settings Proceedings Title Parser]] | ||
| Line 89: | Line 89: | ||
class Event << Entity >> { | class Event << Entity >> { | ||
acronym : TEXT | acronym : TEXT | ||
eventId : TEXT | eventId : TEXT | ||
ordinal : INTEGER | |||
source : TEXT | source : TEXT | ||
title : TEXT | title : TEXT | ||
year : INTEGER | |||
} | |||
class event_ceurws << Entity >> { | |||
city : TEXT | |||
country : TEXT | |||
daterange : TEXT | |||
debug : BOOLEAN | |||
delimiter : TEXT | |||
description : TEXT | |||
enum : TEXT | |||
eventType : TEXT | |||
extract : TEXT | |||
field : TEXT | |||
frequency : TEXT | |||
location : TEXT | |||
lookupAcronym : TEXT | |||
month : TEXT | |||
organization : TEXT | |||
prefix : TEXT | |||
province : TEXT | |||
publish : TEXT | |||
scope : TEXT | |||
syntax : TEXT | |||
topic : TEXT | |||
url : TEXT | url : TEXT | ||
valid : BOOLEAN | |||
volume : INTEGER | |||
} | |||
class event_tibkat << Entity >> { | |||
alternativeTitles : TEXT | |||
authorGndId : TEXT | |||
bk : TEXT | |||
changeDate : TEXT | |||
corporateCreatorNames : TEXT | |||
corporateCreatorTypes : TEXT | |||
databaseDate : TEXT | |||
dates : TEXT | |||
ddc : TEXT | |||
description : TEXT | |||
documentGenreCode : TEXT | |||
documentId : TEXT | |||
documentTypeCode : TEXT | |||
doi : TEXT | |||
ean : TEXT | |||
endDate : DATE | |||
event : TEXT | |||
firstid : TEXT | |||
ftxCreationDate : TEXT | |||
gndIds : TEXT | |||
isbn : TEXT | |||
isbn13 : TEXT | |||
journalTitle : TEXT | |||
journalVolumeNumber : TEXT | |||
location : TEXT | |||
ppn : TEXT | |||
publisher : TEXT | |||
pubplace : TEXT | |||
pubyear : TEXT | |||
sponsorGndId : TEXT | |||
startDate : DATE | |||
} | |||
class event_gnd << Entity >> { | |||
acronymCount : INTEGER | |||
acronyms : TEXT | |||
date : TEXT | |||
dateCount : INTEGER | |||
endDate : DATE | |||
event : TEXT | |||
fulltitle : TEXT | |||
homepage : TEXT | |||
location : TEXT | |||
organization : TEXT | |||
place : TEXT | |||
placeCount : INTEGER | |||
places : TEXT | |||
startDate : DATE | |||
variant : TEXT | |||
variantCount : INTEGER | |||
variants : TEXT | |||
} | } | ||
class event_orclone << Entity >> { | class event_orclone << Entity >> { | ||
DblpConferenceId : TEXT | |||
ISBN : TEXT | |||
TibKatId : TEXT | |||
acceptedPapers : INTEGER | acceptedPapers : INTEGER | ||
city : TEXT | |||
country : TEXT | |||
creationDate : TIMESTAMP | creationDate : TIMESTAMP | ||
endDate : TIMESTAMP | endDate : TIMESTAMP | ||
| Line 110: | Line 187: | ||
lastEditor : TEXT | lastEditor : TEXT | ||
modificationDate : TIMESTAMP | modificationDate : TIMESTAMP | ||
pageTitle : TEXT <<PK>> | pageTitle : TEXT <<PK>> | ||
region : TEXT | region : TEXT | ||
startDate : TIMESTAMP | startDate : TIMESTAMP | ||
submittedPapers : INTEGER | submittedPapers : INTEGER | ||
url : TEXT | |||
wikidataId : TEXT | |||
yearStr : TEXT | yearStr : TEXT | ||
} | } | ||
class event_wikidata << Entity >> { | |||
country : TEXT | |||
countryId : TEXT | |||
dblpId : TEXT | |||
class | describedAtUrl : TEXT | ||
doi : TEXT | |||
endDate : TEXT | endDate : TIMESTAMP | ||
eventInSeries : TEXT | |||
eventInSeriesId : TEXT | |||
eventTitle : TEXT | |||
followedById : TEXT | |||
gndId : TEXT | |||
homepage : TEXT | homepage : TEXT | ||
language : TEXT | |||
location : TEXT | |||
locationId : TEXT | |||
mainSubject : TEXT | |||
ppn : TEXT | |||
proceedings : TEXT | |||
proceedingsLabel : TEXT | |||
startDate : TIMESTAMP | |||
url : TEXT | |||
wikiCfpId : TEXT | |||
} | } | ||
class event_crossref << Entity >> { | class event_crossref << Entity >> { | ||
doi : TEXT | doi : TEXT | ||
endDate : DATE | endDate : DATE | ||
| Line 163: | Line 226: | ||
name : TEXT | name : TEXT | ||
number : TEXT | number : TEXT | ||
sponsor : TEXT | sponsor : TEXT | ||
startDate : DATE | startDate : DATE | ||
theme : TEXT | theme : TEXT | ||
url : TEXT | |||
} | } | ||
class event_dblp << Entity >> { | |||
booktitle : TEXT | |||
doi : TEXT | |||
ee : TEXT | |||
class | |||
endDate : TIMESTAMP | endDate : TIMESTAMP | ||
isbn : TEXT | |||
mdate : TEXT | |||
publicationSeries : TEXT | |||
series : TEXT | |||
startDate : TIMESTAMP | startDate : TIMESTAMP | ||
url : TEXT | |||
} | } | ||
class event_wikicfp << Entity >> { | class event_wikicfp << Entity >> { | ||
Final_Version_Due : TEXT | Final_Version_Due : TEXT | ||
Notification_Due : TIMESTAMP | Notification_Due : TIMESTAMP | ||
Submission_Deadline : TIMESTAMP | Submission_Deadline : TIMESTAMP | ||
deleted : BOOLEAN | |||
deleted : | |||
endDate : TIMESTAMP | endDate : TIMESTAMP | ||
eventType : TEXT | eventType : TEXT | ||
locality : TEXT | locality : TEXT | ||
series : TEXT | series : TEXT | ||
seriesId : TEXT | seriesId : TEXT | ||
startDate : TIMESTAMP | startDate : TIMESTAMP | ||
url : TEXT | |||
wikiCfpId : INTEGER | wikiCfpId : INTEGER | ||
} | } | ||
class event_orclonebackup << Entity >> { | |||
DblpConferenceId : TEXT | |||
ISBN : TEXT | |||
acceptedPapers : TEXT | |||
class | city : TEXT | ||
country : TEXT | |||
endDate : TIMESTAMP | endDate : TIMESTAMP | ||
eventType : TEXT | eventType : TEXT | ||
homepage : TEXT | homepage : TEXT | ||
inEventSeries : TEXT | inEventSeries : TEXT | ||
pageTitle : TEXT <<PK>> | pageTitle : TEXT <<PK>> | ||
presence : TEXT | |||
region : TEXT | region : TEXT | ||
startDate : TIMESTAMP | startDate : TIMESTAMP | ||
submittedPapers : | submittedPapers : TEXT | ||
url : TEXT | |||
wikiMarkup : TEXT | |||
wikicfpId : TEXT | |||
wikidataId : TEXT | |||
yearStr : TEXT | yearStr : TEXT | ||
} | } | ||
class event_confref << Entity >> { | |||
area : TEXT | |||
city : TEXT | |||
country : TEXT | |||
class | dblpSeriesId : TEXT | ||
endDate : TEXT | endDate : TEXT | ||
keywords : TEXT | |||
ranks : TEXT | |||
seriesId : TEXT | |||
seriesTitle : TEXT | |||
startDate : TEXT | startDate : TEXT | ||
submissionExtended : BOOLEAN | |||
url : TEXT | |||
} | } | ||
Event <|-- event_ceurws | |||
Event <|-- event_tibkat | |||
Event <|-- event_gnd | |||
Event <|-- event_orclone | Event <|-- event_orclone | ||
Event <|-- event_wikidata | |||
Event <|-- event_crossref | |||
Event <|-- event_dblp | |||
Event <|-- event_wikicfp | |||
Event <|-- event_orclonebackup | Event <|-- event_orclonebackup | ||
Event <|-- event_confref | Event <|-- event_confref | ||
} | } | ||
Revision as of 06:05, 6 April 2022
OsProject
| OsProject | |
|---|---|
| id | ConferenceCorpus |
| state | active |
| owner | WolfgangFahl |
| title | Scientific Event Corpus |
| url | https://github.com/WolfgangFahl/ConferenceCorpus |
| version | 0.0.10 |
| description | |
| date | 2021-08-03 |
| since | 2021-07-26 |
| until | |
Freitext
Installation
via pip
pip install ConferenceCorpus
# alternatively if your pip is not a python3 pip
pip3 install ConferenceCorpus
upgrade
pip install ConferenceCorpus -U
# alternatively if your pip is not a python3 pip
pip3 install ConferenceCorpus -U
Usage
RESTful API
Examples
- https://conferencecorpus.bitplan.com/eventseries/WEBIST?format=json
- https://conferencecorpus.bitplan.com/eventseries/WEBIST?format=html
- https://conferencecorpus.bitplan.com/eventseries/ISWC?format=json
- https://conferencecorpus.bitplan.com/eventseries/ISWC?format=html
Database View with SQLite
The EventCorpus.db is in SQLite format.
using sqlite-web
pip install sqlite-web
sqlite_web $HOME/.conferencecorpus/EventCorpus.db
There is a convenience script, ccsqliteweb, available in the scripts directory; it also kills any existing sqlite_web EventCorpus.db process and runs the server in the background using nohup.
Command Line
aelookup -h
usage: aelookup [-h] [-d] [-e ENDPOINT] [-v] [-u] [-f]
[--datasources DATASOURCES]
Scientific Event Corpus and Lookup
Created by Wolfgang Fahl on 2020-06-22.
Copyright 2020-2021 Wolfgang Fahl. All rights reserved.
Licensed under the Apache License 2.0
http://www.apache.org/licenses/LICENSE-2.0
Distributed on an "AS IS" basis without warranties
or conditions of any kind, either express or implied.
USAGE
optional arguments:
-h, --help show this help message and exit
-d, --debug show debug info
-e ENDPOINT, --endpoint ENDPOINT
SPARQL endpoint to use for wikidata queries
-v, --version show program's version number and exit
-u, --uml output plantuml diagram markup
-f, --force force Update - may take quite a time
--datasources DATASOURCES
, delimited list of datasource lookup ids
Overview
Datasources
You might want to open the diagrams in a new tab to be able to click the links depicted.
Event
EventSeries
Updating the database
Openresearch
scripts/getbackup
gets a copy of the nightly OpenResearch backups
Issues
- Issue 33 - Event series completion
- Issue 32 - regression TemplateNotFound: fb4common/base.html
- Issue 31 - Provide RDF export of the data
- Issue 30 - add ordinal distribution query✓
- Issue 29 - add scholar RESTFul API
- Issue 28 - add generic search for scholarly items
- Issue 27 - openresearch results missing in multiquery
- Issue 26 - add bib file import
- Issue 25 - make multiquery result available via webapi with content negotiation✓
- Issue 24 - allow updating the database via webserver
- Issue 23 - dictOfLod Lookup result via commandline
- Issue 22 - add multi query option✓
- Issue 21 - add Webserver✓
- Issue 20 - Work around upstream Nominatim OSM Pythontools issue✓
- Issue 19 - Update Openresearch Samples✓
- Issue 18 - Update requirements.txt✓
- Issue 17 - include ACM digital library as a source
- Issue 16 - Steps towards csv upload✓
- Issue 15 - Filter obviously invalid Series and Event entries✓
- Issue 14 - wikiCFP 500 Internal Server and TimeOut Error Handling✓
- Issue 12 - Relevant FTX fields
- Issue 11 - Locality fixes
- Issue 10 - OpenResearch export option
- Issue 9 - offline access to EventCorpus.db
- Issue 8 - migrate confref data from Proceedings Title Parser here✓
- Issue 7 - migrate crossref data from proceedings title parser here✓
- Issue 6 - migrate dblp data source here from ptp and dblpconf✓
- Issue 5 - dblp xml parser skips some proceedings titles
- Issue 4 - add commandline interface to CorpusLookup✓
- Issue 3 - add python api doc✓
- Issue 2 - Cache all SQL tables in the same SQLite database in a ".conferencecorpus" directory✓
- Issue 1 - There should be a common set of attributes for Event and EventSeries from different datasources