update
This commit is contained in:
@@ -12,7 +12,7 @@ query.sh
|
|||||||
|
|
||||||
## 1. Verzamelen van berichten
|
## 1. Verzamelen van berichten
|
||||||
|
|
||||||
Berichten van NieuwsNL in `NieuwsNL/yyyy/mm/dd/`
|
Berichten van NieuwsNL in `NieuwsNL/yyyy/mm/dd/` TODO
|
||||||
|
|
||||||
Overigen in `[A-Z]*/yyyy/ww/` (weeknummer)
|
Overigen in `[A-Z]*/yyyy/ww/` (weeknummer)
|
||||||
|
|
||||||
1
README.user.md
Normal file
1
README.user.md
Normal file
@@ -0,0 +1 @@
|
|||||||
|
TODO
|
||||||
@@ -1,5 +1,5 @@
|
|||||||
nw <- read.table('data/2026/algemeen-count-per-2026.23-1', sep="\t", quote="", encoding="utf-8", col.names=c("f", "word"))
|
nw <- read.table('data/2026/algemeen-allewoorden-2026.23-1', sep="\t", quote="", encoding="utf-8", col.names=c("f", "word", "tags"))
|
||||||
od <- read.table('data/2026/algemeen-count-per-2026.22-4', sep="\t", quote="", encoding="utf-8", col.names=c("f", "word"))
|
od <- read.table('data/2026/algemeen-allewoorden-2026.22-4', sep="\t", quote="", encoding="utf-8", col.names=c("f", "word", "tags"))
|
||||||
words <- unique(c(od$word, nw$word))
|
words <- unique(c(od$word, nw$word))
|
||||||
o <- order(words)
|
o <- order(words)
|
||||||
words <- words[o]
|
words <- words[o]
|
||||||
@@ -26,3 +26,8 @@ nieuw[nieuw == 0] <- 0.5
|
|||||||
plot(log(oud), log(nieuw))
|
plot(log(oud), log(nieuw))
|
||||||
lines(log(range(oud)), log(range(nieuw)))
|
lines(log(range(oud)), log(range(nieuw)))
|
||||||
identify(log(oud), log(nieuw), labels=words)
|
identify(log(oud), log(nieuw), labels=words)
|
||||||
|
|
||||||
|
|
||||||
|
#plot(oud, nieuw)
|
||||||
|
#lines(range(oud), range(nieuw))
|
||||||
|
#identify(oud, nieuw, labels=words)
|
||||||
|
|||||||
Reference in New Issue
Block a user