-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcreate_exfor_mongodb.R
More file actions
72 lines (63 loc) · 2.29 KB
/
create_exfor_mongodb.R
File metadata and controls
72 lines (63 loc) · 2.29 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# The MIT License
#
# Copyright (c) 2019 Georg Schnabel
#
# Permission is hereby granted, free of charge,
# to any person obtaining a copy of this software and
# associated documentation files (the "Software"), to
# deal in the Software without restriction, including
# without limitation the rights to use, copy, modify,
# merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom
# the Software is furnished to do so,
# subject to the following conditions:
#
# The above copyright notice and this permission notice
# shall be included in all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
# OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR
# ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
#
# load necessary packages and script modules
library(mongolite)
library(data.table)
library(exforParser)
# Import EXFOR entry files into MongoDB: every subentry of every entry file
# is converted with convToJSON() and inserted as one document into the
# collection "entries" of the database "exfor" on mongodb://localhost.
#
# Files that cannot be read or converted are skipped, recorded in
# `errorFiles` / counted in `errorCounter`, and listed in a summary at the
# end. Errors raised by the database insert itself are NOT caught: they
# abort the script, because continuing without a working connection would
# silently lose data.

# collect the entry files to import
# (replace the placeholder with the directory containing the EXFOR entries)
exforFiles <- list.files("<PATH TO DIRECTORY WITH EXFOR ENTRIES>",
                         pattern = "entry.*txt", full.names = TRUE)
numFiles <- length(exforFiles)
if (numFiles == 0) {
  # list.files() returns character(0) without complaint for a missing or
  # empty directory; make that visible instead of finishing silently
  warning("No EXFOR entry files found - nothing will be imported",
          call. = FALSE)
}

m <- mongo("entries", db = "exfor", url = "mongodb://localhost")

# bookkeeping of files that had to be skipped
errorCounter <- 0
errorFiles <- character(0)

# loop over entries
for (idx in seq_along(exforFiles)) {
  cat("read file ", idx, " of ", numFiles, "\n")
  curFile <- exforFiles[idx]

  # read the whole file into a single string
  curText <- try(readChar(curFile, file.info(curFile)$size), silent = TRUE)
  if (inherits(curText, "try-error")) {
    cat("Problems reading ", curFile, "\n")
    errorCounter <- errorCounter + 1
    errorFiles <- c(errorFiles, curFile)
    next
  }

  # Parse the entry and convert ALL of its subentries before touching the
  # database, so that a malformed file is skipped as a whole instead of
  # aborting the import or leaving a partially inserted entry behind.
  jsonObjs <- tryCatch({
    curEntry <- parseEntry(curText)
    subents <- curEntry$SUBENT
    converted <- vector("list", length(subents))
    firstSub <- NULL
    # loop over subentries
    for (idx2 in seq_along(subents)) {
      curSub <- subents[[idx2]]
      if (idx2 == 1) {
        # the first subentry is stored as is and kept as reference
        firstSub <- curSub
      } else {
        # NOTE(review): presumably merges the information shared via the
        # first subentry into the current one - confirm in exforParser docs
        curSub <- transformSubent(firstSub, curSub)
      }
      # assign via list() so that a NULL result keeps its slot
      converted[idx2] <- list(convToJSON(curSub))
    }
    converted
  }, error = function(e) {
    cat("Problems parsing ", curFile, ": ", conditionMessage(e), "\n")
    NULL
  })
  if (is.null(jsonObjs)) {
    errorCounter <- errorCounter + 1
    errorFiles <- c(errorFiles, curFile)
    next
  }

  # insert one document per subentry, in subentry order
  for (jsonObj in jsonObjs) {
    m$insert(jsonObj)
  }
}

# report the outcome; the failure bookkeeping is otherwise easy to miss
cat("imported ", numFiles - errorCounter, " of ", numFiles, " files\n")
if (errorCounter > 0) {
  cat("files skipped because of problems:\n")
  cat(paste0("  ", errorFiles), sep = "\n")
}