# Extract genetic codes from a web page like the ones found on NCBI.
#
# Input:  the HTML text of the page, one record per line.
# Output: for every table heading of the form
#             N. Some Name (transl_table=N)
#         the name with tags, parenthetical content, the leading number and
#         all spaces removed, followed by the unmodified "AAs", "Starts" and
#         "Base1".."Base3" lines of that table.
#
# Each rule must start on its own line: a '#' comment runs to the end of the
# line, and a bare pattern on a line by itself is a complete rule whose
# default action is to print the record.

# Closing </pre>: leave the preformatted section.
# NOTE(review): no rule in this file reads `printing`; it is only maintained
# here and in the <pre> rule below -- confirm whether output was meant to be
# gated on it.
/<\/pre>/ {
  printing = 0;
}

# Table heading, optionally wrapped in <h3>, e.g.
#   <h3>1. The Standard Code (transl_table=1)</h3>
/^ *(<[Hh]3>)? *[1-9][0-9]?\. *.*\(transl_table=[1-9][0-9]*\)/ {
  gsub( / *<[^>]+> */, "" );        # Remove tags.

  # Pull the table number out of the first parenthesised group.
  # NOTE(review): `n` is not used by any rule in this file; it is kept in case
  # another program file combined with this one reads it.
  split( $0, a, /[()]/ );
  split( a[2], b, /=/ );
  n = b[2];

  gsub( /\([^)]*\)/, "" );          # Remove parenthetical content.
  sub( /^ *[1-9][0-9]*\. /, "" );   # Remove number.
  gsub( / +/, "" );                 # Remove spaces.
  print;
}

# Sequence lines of a table.  The labels are column-aligned in the page, so
# the amount of blank space before the label and before '=' varies; accept
# any run of one or more spaces in those positions.
/^ +AAs += / {
  print;
}

/^ +Starts += / {
  print;
}

/^ +Base[123] += / {
  print;
}

# Opening <pre>: enter the preformatted section.
/<pre>/ {
  printing = 1;
}