#!/bin/sh
###########################################################################
##                                                                       ##
##                  Language Technologies Institute                      ##
##                    Carnegie Mellon University                         ##
##                         Copyright (c) 2002                            ##
##                        All Rights Reserved.                           ##
##                                                                       ##
##  Permission is hereby granted, free of charge, to use and distribute  ##
##  this software and its documentation without restriction, including   ##
##  without limitation the rights to use, copy, modify, merge, publish,  ##
##  distribute, sublicense, and/or sell copies of this work, and to      ##
##  permit persons to whom this work is furnished to do so, subject to   ##
##  the following conditions:                                            ##
##   1. The code must retain the above copyright notice, this list of    ##
##      conditions and the following disclaimer.                         ##
##   2. Any modifications must be clearly marked as such.                ##
##   3. Original authors' names are not deleted.                         ##
##   4. The authors' names are not used to endorse or promote products   ##
##      derived from this software without specific prior written        ##
##      permission.                                                      ##
##                                                                       ##
##  CARNEGIE MELLON UNIVERSITY AND THE CONTRIBUTORS TO THIS WORK         ##
##  DISCLAIM ALL WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING      ##
##  ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT   ##
##  SHALL CARNEGIE MELLON UNIVERSITY NOR THE CONTRIBUTORS BE LIABLE      ##
##  FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES    ##
##  WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN   ##
##  AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,          ##
##  ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF       ##
##  THIS SOFTWARE.                                                       ##
##                                                                       ##
###########################################################################
##                                                                       ##
##   data_minus a.data b.data >a-b.data                                  ##
##                                                                       ##
##   Matches on the fileid alone, so b.data need not have the same       ##
##   text as a.data; this can be used to remove segs from txt files.     ##
##                                                                       ##
###########################################################################

# Print every line of a.data ($1) that does not belong to a file id listed
# in b.data ($2).
#
# Arguments:
#   $1 - prompt file to filter; a line is dropped when it contains the
#        literal text "( ID " for some ID taken from $2
#   $2 - prompt file whose second whitespace-separated field is the file id;
#        when omitted, the ids are read from standard input
# Output:
#   the surviving lines of $1, in their original order, on stdout
# Exit status:
#   1 after the usage message or if the scratch file cannot be created,
#   the failing tool's status if awk, grep or cat fails, 0 otherwise
if [ $# = 0 ]
then
   echo "Substract a set of prompts from a given prompt set"
   echo 'assumes $2 is the file id'
   echo "Usage:  dataset_minus a.data b.data >a-b.data"
   exit 1
fi

LANG=C; export LANG

# Scratch file with an unpredictable name (a fixed /tmp/ds_min_$$ name can be
# pre-created or symlinked by another user); removed on every exit path.
PATFILE=$(mktemp "${TMPDIR:-/tmp}/ds_min.XXXXXX") || exit 1
trap 'rm -f "$PATFILE"' 0
# Turn signals into a normal exit so the cleanup trap above still runs.
trap 'exit 1' 1 2 15

# One "( ID " pattern per id.  Lines with fewer than two fields carry no id
# and are skipped, so an empty pattern can never be produced.
awk 'NF >= 2 { print "( " $2 " " }' "${2:--}" >"$PATFILE" || exit $?

if [ -s "$PATFILE" ]
then
   # -F matches the ids as fixed strings rather than regular expressions, so
   # characters such as "." or "*" in an id only match themselves; -f handles
   # all ids in a single pass over $1.
   grep -F -v -f "$PATFILE" -- "$1"
   STATUS=$?
   # grep exits 1 when no line survives, which is a valid (empty) result;
   # only statuses above 1 signal a real error.
   [ "$STATUS" -le 1 ] || exit "$STATUS"
else
   # No ids to remove: pass $1 through unchanged.
   cat -- "$1" || exit $?
fi
exit 0

