From ef583a04a2f39c77527363c2af37b7c1f53f91db Mon Sep 17 00:00:00 2001 From: Brandon Date: Fri, 27 Apr 2018 10:09:02 -0400 Subject: [PATCH] change directory and NER file link --- README.md | 21 +++++++++++++++++++++ batchner.sh | 2 +- 2 files changed, 22 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index c788465..07c0167 100644 --- a/README.md +++ b/README.md @@ -1 +1,22 @@ Batch script for Named Entity Recognition + +# Folder Setup +── project folder +├── stanford-ner-2018-02-27 +├── file1.txt +├── file2.txt +├── file1.txt +├── file2.txt +│ ├── cgi +│ │ ├── cgi0.sh + + +── project folder + +├── batchner.sh +├── file1.txt +├── file2.txt +├── file3.txt +├── file4.txt + +── pr \ No newline at end of file diff --git a/batchner.sh b/batchner.sh index 48c7343..76d5d49 100644 --- a/batchner.sh +++ b/batchner.sh @@ -6,7 +6,7 @@ for file in *.txt do -nertext=$(../stanford-ner-2017-06-09/ner.sh $file) +nertext=$(stanford-ner-2018-02-27/ner.sh $file) echo $nertext | egrep -o "(([[:alnum:]]|\.)+/ORGANIZATION([[:space:]]|$))+" | sed 's/\/ORGANIZATION//g' | sort | uniq -c | awk -v name=${file##*/} '{printf name ","; for (i = 2; i < NF; i++) printf $i " "; printf $NF; printf "," "organization" ","; printf $1; print ""}' >> entities.csv