| #!/bin/bash | 
 |  | 
 | printHelp(){ | 
 |   echo "Please use the following command:" | 
 |   echo "  ./compareVC.sh [Cosmas2 VC-file] [VC-file]" | 
 |   echo "" | 
 |   echo "The Cosmas2 virtual corpus should have the following format: " | 
 |   echo "  <text>DOL00/JAN.00504</text>" | 
 |   echo "" | 
 |   echo "The other VC should contain a simple list of text Sigle, i.e. one text sigle per line. In the following format:" | 
 |   echo "  DOL00/APR/00055" | 
 | } | 
 |  | 
 | vc1=$1 | 
 | vc2=$2 | 
 |  | 
 | if [ -z $1 ]||[ -z $2 ]; | 
 | then | 
 |     printHelp | 
 |     exit | 
 | fi | 
 |  | 
 | firstLine="$(head -n 1 $vc1)" | 
 |  | 
 | if ! [[ $firstLine =~ ^\<text\> ]]; | 
 | then | 
 |   printHelp | 
 |   exit | 
 | fi | 
 |  | 
 | cat $vc1 | sed -E 's/<\/?text>//g' - |  sed 's/\./\//' -| sort > vc1 | 
 |  | 
 | cat $vc2 | sort > vc2 | 
 |  | 
 | echo $1 | 
 | wc -l vc1 | 
 | echo $2 | 
 | wc -l vc2 | 
 |  | 
 | meld vc1 vc2 |