#!/bin/bash
#######################################
# Print the usage text for compareVC.sh.
# Arguments: none
# Outputs:   writes the expected invocation and the two accepted
#            virtual-corpus file formats to stdout
#######################################
printHelp() {
  # One printf argument per output line; '%s\n' is re-applied to each, and
  # single quotes keep the sample markup (<text>...</text>) literal.
  printf '%s\n' \
    'Please use the following command:' \
    ' ./compareVC.sh [Cosmas2 VC-file] [VC-file]' \
    '' \
    'The Cosmas2 virtual corpus should have the following format: ' \
    ' <text>DOL00/JAN.00504</text>' \
    '' \
    'The other VC should contain a simple list of text Sigle, i.e. one text sigle per line. In the following format:' \
    ' DOL00/APR/00055'
}
# Compare a Cosmas2 virtual corpus with a plain list of text sigles.
#
# Arguments:
#   $1 - Cosmas2 VC file; its first line must start with "<text>".
#   $2 - VC file holding one text sigle per line.
# Outputs:
#   Each input path followed by the line count of its normalised, sorted
#   copy; afterwards both copies are opened side by side in meld.
# Exit status:
#   1 when an argument is missing, an input is unreadable, the first file
#   does not start with "<text>", or a preparation step fails; otherwise
#   the exit status of meld.
set -o pipefail

vc1=${1:-}
vc2=${2:-}

if [[ -z "$vc1" || -z "$vc2" ]]; then
  printHelp >&2
  exit 1
fi

for input in "$vc1" "$vc2"; do
  if [[ ! -r "$input" ]]; then
    printf 'Cannot read file: %s\n' "$input" >&2
    exit 1
  fi
done

# Only the first line is inspected to decide whether $1 is in Cosmas2 format.
first_line=$(head -n 1 < "$vc1")
if [[ "$first_line" != '<text>'* ]]; then
  printHelp >&2
  exit 1
fi

# Work on copies in a private directory: writing to fixed names in the
# current directory would overwrite unrelated files and could truncate an
# input that happens to be called vc1 or vc2 before it has been read.
work_dir=$(mktemp -d) || exit 1
trap 'rm -rf -- "$work_dir"' EXIT

# Strip the <text>/</text> tags, then turn the first "." of every line into
# "/" so that e.g. DOL00/JAN.00504 becomes DOL00/JAN/00504.
sed -E -e 's/<\/?text>//g' -e 's/\./\//' < "$vc1" | sort > "$work_dir/vc1" \
  || exit 1
sort < "$vc2" > "$work_dir/vc2" || exit 1

# Run wc from inside the work directory so the counts are reported with the
# short names "vc1" and "vc2" rather than the temporary path.
printf '%s\n' "$vc1"
(cd "$work_dir" && wc -l vc1)
printf '%s\n' "$vc2"
(cd "$work_dir" && wc -l vc2)

meld "$work_dir/vc1" "$work_dir/vc2"