Commit 07052fcc authored by Neeme Kahusk
Browse files

unique synset numbers

parent e134b523
......@@ -27,12 +27,15 @@ else
# Pull the number out of every record line that starts with "0" and is shaped
# like "0 @<digits>@..."; lines the sed pattern does not match pass through
# unchanged. all.numbers receives each distinct extracted value once, sorted.
grep -- '^0' "$1" \
  | sed -E 's/(0 @)([0-9]+)(@.+$)/\2/g' \
  | sort \
  | uniq > all.numbers

# doubled.numbers receives the values that occur more than once, most
# frequent first. The count is tested numerically and the "<padding><count> "
# prefix is stripped regardless of its width: the previous filter required
# exactly three leading spaces followed by a single digit 2-9, so it depended
# on how a given uniq pads its counts and dropped values seen 10+ times.
grep -- '^0' "$1" \
  | sed -E 's/(0 @)([0-9]+)(@.+$)/\2/g' \
  | sort \
  | uniq -c \
  | sort -nr \
  | awk '$1 >= 2' \
  | sed -E 's/^ *[0-9]+ //' > doubled.numbers

# Hand a copy of the input (tempfile) to the Python helper together with both
# number lists; its stdout becomes the export file.
cp -- "$1" tempfile
python unique_synsets.py all.numbers doubled.numbers tempfile > "$EXPORTFILE"
# rm all.numbers
# rm doubled.numbers
fi
# Print the two synset totals, one per line. Both variables are assigned
# outside this excerpt; presumably original vs. unique synset counts, judging
# by the names — TODO confirm.
echo "$NO_OF_ORIGSYNSETS"
echo "$NO_OF_UNIQESYNSETS"
# NOTE(review): unconditional exit — nothing below this line runs. Confirm
# this early stop is intentional and not a leftover from debugging.
exit
# all operations are done on NORMFILE!
# extensions of index files
......
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment