Extract the first two columns (token, token/POS) from .tag files:

(1) .2col file preparation:
    Keeps columns 1 and 2 and strips the EOS, #, ^ and DEP markers.
    The "+DEP" and "DEP+" forms are removed before the bare "DEP" so that
    no stray "+" is left behind; "[+]" is a literal plus sign in every sed.
    ">!" is the csh/tcsh redirection that overwrites an existing file even
    when noclobber is set.

> awk '{print $1, $2}' 302000.tag | sed 's/EOS//' | sed 's/[#\^]//' | sed 's/[+]DEP//' | sed 's/DEP[+]//' | sed 's/DEP//' >! 302000.tag.2col

(2) .1col file preparation:
    Splits the token/POS column on "+" and writes one morpheme/POS pair per
    line. FS is set in BEGIN so that it already applies to the first input
    line; "print" is used instead of "printf" so that a "%" or "\" in the
    data is not interpreted as a format directive.

> awk '{print $2}' 302000.tag.2col | awk 'BEGIN {FS="+"} {for (i=1; i <= NF; i+=1) {print $i}}' > 302000.tag.1col

(3) .1col-2 file preparation:
    Splits each morpheme/POS pair on "/" into two columns.
    FS is set in BEGIN so that the first input line is split as well.

> awk 'BEGIN {FS="/"} {print $1, "\t", $2}' 302000.tag.1col > 302000.tag.1col-2

(4) .1col.rom file preparation:
    Passes the morpheme column through /home/kyoon/han2phon and then
    rewrites ae -> e, oe -> we, yi -> eui in its output.
    FS is set in BEGIN so that the first input line is split as well.

> awk 'BEGIN {FS="/"} {print $1}' 302000.tag.1col | /home/kyoon/han2phon | sed 's/ae/e/g' | sed 's/oe/we/g' | sed 's/yi/eui/g' > 302000.tag.1col.rom

(5) .rom.han.pos file preparation:
    Joins the files from (4) and (3) line by line.

> paste 302000.tag.1col.rom 302000.tag.1col-2 > 302000.rom.han.pos