16 |
if (is(readerControl$reader, "FunctionGenerator")) |
if (is(readerControl$reader, "FunctionGenerator")) |
17 |
readerControl$reader <- readerControl$reader(...) |
readerControl$reader <- readerControl$reader(...) |
18 |
if (is.null(readerControl$language)) |
if (is.null(readerControl$language)) |
19 |
readerControl$language = "en_US" |
readerControl$language <- "en_US" |
20 |
if (is.null(readerControl$load)) |
if (is.null(readerControl$load) || (!object@LoDSupport)) |
21 |
readerControl$load = TRUE |
readerControl$load <- TRUE |
22 |
|
|
23 |
if (dbControl$useDb && require("filehash")) { |
if (dbControl$useDb && require("filehash")) { |
24 |
if (!dbCreate(dbControl$dbName, dbControl$dbType)) |
if (!dbCreate(dbControl$dbName, dbControl$dbType)) |
32 |
else |
else |
33 |
list() |
list() |
34 |
|
|
35 |
|
if ((!dbControl$useDb) && object@Vectorized) |
36 |
|
tdl <- lapply(mapply(c, pGetElem(object), id = seq_len(object@Length), SIMPLIFY = FALSE), |
37 |
|
function(x) readerControl$reader(x[c("content", "uri")], |
38 |
|
readerControl$load, |
39 |
|
readerControl$language, |
40 |
|
as.character(x$id))) |
41 |
|
else { |
42 |
counter <- 1 |
counter <- 1 |
43 |
while (!eoi(object)) { |
while (!eoi(object)) { |
44 |
object <- stepNext(object) |
object <- stepNext(object) |
45 |
elem <- getElem(object) |
elem <- getElem(object) |
|
# If there is no Load on Demand support |
|
|
# we need to load the corpus into memory at startup |
|
|
if (!object@LoDSupport) |
|
|
readerControl$load <- TRUE |
|
46 |
doc <- readerControl$reader(elem, readerControl$load, readerControl$language, as.character(counter)) |
doc <- readerControl$reader(elem, readerControl$load, readerControl$language, as.character(counter)) |
47 |
if (dbControl$useDb && require("filehash")) { |
if (dbControl$useDb && require("filehash")) { |
48 |
dbInsert(db, ID(doc), doc) |
dbInsert(db, ID(doc), doc) |
59 |
} |
} |
60 |
counter <- counter + 1 |
counter <- counter + 1 |
61 |
} |
} |
62 |
|
} |
63 |
|
|
64 |
df <- data.frame(MetaID = rep(0, length(tdl)), stringsAsFactors = FALSE) |
df <- data.frame(MetaID = rep(0, length(tdl)), stringsAsFactors = FALSE) |
65 |
if (dbControl$useDb && require("filehash")) { |
if (dbControl$useDb && require("filehash")) { |