-
Notifications
You must be signed in to change notification settings - Fork 0
/
uf-drop
executable file
·73 lines (60 loc) · 2.15 KB
/
uf-drop
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
#!/bin/sh
#
# uf-drop - Drop characters from head of unfasta format sequences.
# Copyright (C) 2016 Marco van Zwetselaar <[email protected]>
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# This utility is part of http://io.zwets.it/unfasta
# Function to exit this script with an error message on stderr
err_exit() {
echo "$(basename "$0"): $*" >&2
exit 1
}
# Function to show usage information and exit
usage_exit() {
echo "
Usage: $(basename $0) [OPTIONS] NUM [FILE ...]
For each sequence in each unfasta format FILE drop the first NUM characters
and write the remainder of the sequence to standard output. If no FILE is
present or when FILE is '-', read standard input. With modifier -b|--but,
drop all except the final NUM characters.
Options
-b, --but Drop everything BUT the final NUM characters from each sequence.
-m, --mark Document the edit by appending '(uf:drop:[but:]NUM)' to headers.
" >&2
exit ${1:-1}
}
# Parse options
BUT=0
MARK=0
while [ $# -ne 0 -a "$(expr "$1" : '\(.\)..*')" = "-" ]; do
case $1 in
-m|--mark) MARK=1 ;;
-b|--but) BUT=1 ;;
-h|--help) usage_exit 0 ;;
*) usage_exit ;;
esac
shift || usage_exit
done
# Check first argument is positive number
[ $# -ge 1 -a "$(expr "$1" : '\([0-9]\+\)')" = "$1" ] || usage_exit
NUM=$1
shift
# Delegate to gawk
gawk -bO -v P="$(basename "$0")" -v N=$NUM -v M=$MARK -v B=$BUT '
NR%2==1 { print $0 (M ? " (uf:drop:" (B?"but:":"") N ")" : "") }
NR%2==0 { print B ? substr ($0,length($0)-N+1) : substr ($0,N+1) }
' "$@"
# vim: sts=4:sw=4:et:si:ai