forked from dilawar/Scripts
-
Notifications
You must be signed in to change notification settings - Fork 0
/
csv2gnuplot.sh
executable file
·376 lines (340 loc) · 8.84 KB
/
csv2gnuplot.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
#!/bin/bash
#
# This transforms a CSV file into a gnuplot file.
# use option '-h' to display a help screen for all options.
#
# FracPete (original script)
# Ben Cot (improved usage screen)
# Prints the help screen on stderr. The text embeds the current values of
# DELIMITER, FORMAT, WIDTH and HEIGHT as the documented defaults, and $0 as
# the program name.
usage() {
  cat 1>&2 <<END_OF_USAGE
usage: $0 [-i <file>] [-o <file>] [-g <file>] [-G <file>] [-O <file>]
[-d <delim>] [-t] [-x] [-a] [-l] [-T]
[-W <width> -H <height>] [-F <x11|png|ps>] [-b <files>] [-e] [-h]
Transforms a given CSV file into a gnuplot input file. It can also
produce a gnuplot script for plotting the data, as well as batch
processing of several files with automatic output generation.
-h Show this help information
Input/Output:
-i <file> input filename
-o <file> output filename
-g <file> generates a gnuplot script with this name to display
the data, it assumes that the first column is the index
for the x-axis.
In combination with '-b' this parameter is only used to
indicate that a script is wanted, the filename itself is
ignored.
-G <file> a file containing gnuplot options, comments etc. to be added
before the plots
-O <file> generates a script that outputs the plot in the
format specified with '-F' in a file with the given name,
instead of displaying it in a window
CSV/Data:
-d <delim> the delimiter that separates the columns, default: $DELIMITER
-t transposes the matrix first
-x adds a column for the x-axis (numbers starting from 1)
-a generates the average of the columns
-l adds 'with lines' to the gnuplot script
-T adds a number as title to the gnuplot script
GNUPlot Output:
-F <x11|png|ps> the format of the output, default: $FORMAT
-W <width> the width of the output (if '-F png'), default: $WIDTH
-H <height> the height of the output (if '-F png'), default: $HEIGHT
-b <files> processes the given files in batch mode,
i.e. '-i' and '-o' are not necessary.
the files get new extensions automatically.
-e generates the desired output files directly,
i.e. in creates a temp. gnuplot file and runs this
(in combination with '-b', otherwise '-g' must be given).
Works only if format is ps or png ('-F').
END_OF_USAGE
}
# defaults for everything the command line can set

# file names; an empty value means "not given"
INPUT='' OUTPUT='' OUTPUT_PLOT=''
GNUPLOT='' GNUPLOT_OPTIONS=''

# whether '-o' / '-g' appeared on the command line
HAS_OUTPUT='no' HAS_GNUPLOT='no'

# CSV handling
DELIMITER=','
TRANSPOSE='no' XAXIS='no' AVERAGE='no'

# appearance of the generated plot
LINES='no' TITLE='no'
FORMAT='x11' WIDTH='800' HEIGHT='600'

# batch mode and direct execution
BATCH_FILES='' BATCH_OPTIONS=''
EXECUTE='no'
# interpret parameters

# The '-l' flag is kept in LINES, a variable bash maintains itself: with
# 'checkwinsize' enabled (the default since bash 5.0) bash rewrites LINES
# with the terminal height after external commands, which would silently
# drop '-l' when the script runs from a terminal. Switch that off.
shopt -u checkwinsize

# Options that batch mode hands down unchanged to every per-file run.
# An array (instead of one concatenated string) keeps option arguments that
# contain whitespace or glob characters intact, e.g. -d ' ' or -d '*'.
BATCH_ARGS=()

#######################################
# Parses a command line into the global option variables.
# Globals (written): INPUT OUTPUT HAS_OUTPUT GNUPLOT HAS_GNUPLOT
#   GNUPLOT_OPTIONS DELIMITER TRANSPOSE XAXIS AVERAGE LINES TITLE
#   OUTPUT_PLOT WIDTH HEIGHT FORMAT BATCH_FILES EXECUTE BATCH_ARGS
# Arguments: the command line to parse (normally "$@")
# Exits: 0 after printing the help for '-h';
#        1 on an unknown option or a missing option argument
#######################################
parse_options() {
  local OPTIND=1 OPTARG flag
  while getopts ":hi:o:g:d:txalTF:W:H:O:b:eG:" flag; do
    case "$flag" in
      i)
        INPUT=$OPTARG
        ;;
      o)
        OUTPUT=$OPTARG
        HAS_OUTPUT="yes"
        ;;
      g)
        GNUPLOT=$OPTARG
        HAS_GNUPLOT="yes"
        ;;
      G)
        GNUPLOT_OPTIONS=$OPTARG
        BATCH_ARGS+=("-$flag" "$OPTARG")
        ;;
      d)
        DELIMITER=$OPTARG
        # forwarded so that batch runs split on the same delimiter
        BATCH_ARGS+=("-$flag" "$OPTARG")
        ;;
      t)
        TRANSPOSE="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      x)
        XAXIS="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      a)
        AVERAGE="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      l)
        LINES="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      T)
        TITLE="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      O)
        OUTPUT_PLOT=$OPTARG
        ;;
      W)
        WIDTH=$OPTARG
        BATCH_ARGS+=("-$flag" "$OPTARG")
        ;;
      H)
        HEIGHT=$OPTARG
        BATCH_ARGS+=("-$flag" "$OPTARG")
        ;;
      F)
        FORMAT=$OPTARG
        BATCH_ARGS+=("-$flag" "$OPTARG")
        ;;
      b)
        BATCH_FILES=$OPTARG
        ;;
      e)
        EXECUTE="yes"
        BATCH_ARGS+=("-$flag")
        ;;
      h)
        usage
        exit 0
        ;;
      :)
        # the leading ':' in the option string makes getopts report a
        # missing argument as ':' with the option letter in OPTARG
        {
          echo
          echo "Missing argument for option: '-$OPTARG'"
          echo
        } >&2
        usage
        exit 1
        ;;
      *)
        {
          echo
          echo "Unknown option: '-$OPTARG'"
          echo
        } >&2
        usage
        exit 1
        ;;
    esac
  done
}

#######################################
# Runs this script once per file listed in BATCH_FILES.
# Each run gets the forwarded options plus '-i <file> -o <file>.dat',
# '-g <file>.scr' when a script is wanted or needed for '-e', and
# '-O <file>.<format>' for the png and ps formats.
# Globals (read): BATCH_FILES BATCH_ARGS HAS_GNUPLOT EXECUTE FORMAT
# Returns: 0 if every run succeeded, 1 if at least one failed
#######################################
run_batch() {
  local file status=0
  local -a args
  # BATCH_FILES is a whitespace-separated list passed as a single argument,
  # so it is split (and glob-expanded) on purpose.
  for file in $BATCH_FILES; do
    echo "$file..."
    args=("${BATCH_ARGS[@]}" -i "$file" -o "$file.dat")
    # '-e' cannot work without a script, and the help text promises that
    # '-g' is not required together with '-b'
    if [[ "$HAS_GNUPLOT" == "yes" || "$EXECUTE" == "yes" ]]; then
      args+=(-g "$file.scr")
    fi
    case "$FORMAT" in
      png | ps) args+=(-O "$file.$FORMAT") ;;
    esac
    # keep going after a failure, but remember it for the exit status
    "$0" "${args[@]}" || status=1
  done
  return "$status"
}

parse_options "$@"

# valid combinations of parameters?
if [[ -n "$BATCH_FILES" && "$EXECUTE" == "yes" && "$FORMAT" == "x11" ]]; then
  {
    echo
    echo "ERROR: a format other than '$FORMAT' must be specified if '-b' and"
    echo " '-e' are specified, e.g. 'ps'."
    echo
  } >&2
  usage
  exit 2
fi

# batch-mode?
if [[ -n "$BATCH_FILES" ]]; then
  run_batch
  exit
fi
# test files
#
# All diagnostics in this section go to stderr: without '-o' the converted
# data is written to stdout at the end of the script, so anything printed on
# stdout here would end up inside the data.
if [[ -n "$INPUT" && ! -f "$INPUT" ]]; then
  echo "ERROR: input file '$INPUT' not found!" >&2
  # an unusable input is treated like a missing one by the check below
  INPUT=""
fi
if [[ -n "$GNUPLOT_OPTIONS" && ! -f "$GNUPLOT_OPTIONS" ]]; then
  echo "Warning: '$GNUPLOT_OPTIONS' not found - ignored!" >&2
  GNUPLOT_OPTIONS=""
fi
# without '-o' the data goes to a temporary file next to the input
if [[ "$HAS_OUTPUT" == "no" ]]; then
  OUTPUT=$INPUT".tmp"
fi

# everything provided?
if [[ -z "$INPUT" || -z "$DELIMITER" ]]; then
  {
    echo
    echo "ERROR: not all parameters provided or incorrect!"
    echo
  } >&2
  usage
  exit 1
fi
if [[ "$EXECUTE" == "yes" && "$HAS_GNUPLOT" == "no" ]]; then
  {
    echo
    echo "ERROR: '-g' must be specified with option '-e'!"
    echo
  } >&2
  usage
  exit 3
fi
# a file format needs a file to write to; otherwise display in a window
if [[ -z "$OUTPUT_PLOT" && "$FORMAT" != "x11" ]]; then
  echo "Warning: output file for format '$FORMAT' not specified, falling back to 'x11'" >&2
  FORMAT="x11"
fi
# some variables
TMPFILE=$OUTPUT".tmp"

#######################################
# Replaces every occurrence of a delimiter in a file with one blank.
# Arguments:
#   $1 - delimiter; handed to sed as a basic regular expression
#   $2 - file to rewrite in place
#   $3 - scratch file used while rewriting
#######################################
replace_delimiter() {
  local delim=$1 file=$2 scratch=$3
  # A control character separates the parts of the s command, so a '/'
  # inside the delimiter needs no escaping. The whole expression is quoted,
  # which lets tab and other whitespace delimiters through unharmed.
  local sep=$'\001'
  sed -e "s${sep}${delim}${sep} ${sep}g" < "$file" > "$scratch"
  cp -- "$scratch" "$file"
}

# init
cp -- "$INPUT" "$OUTPUT"

# change modifier into " "
if [[ "$DELIMITER" != " " ]]; then
  replace_delimiter "$DELIMITER" "$OUTPUT" "$TMPFILE"
fi
#######################################
# Transposes a blank-separated matrix stored in a file, in place.
# Row i of the result holds the i-th field of every input line, joined by
# single blanks. The number of output rows is the largest field count seen.
# Arguments:
#   $1 - file to transpose
#   $2 - scratch file used while rewriting
#######################################
transpose_file() {
  local file=$1 scratch=$2
  awk '
    NR == 1 {
      n = NF
      for (i = 1; i <= NF; i++)
        row[i] = $i
      next
    }
    {
      if (NF > n)
        n = NF
      for (i = 1; i <= NF; i++)
        row[i] = row[i] " " $i
    }
    END {
      for (i = 1; i <= n; i++)
        print row[i]
    }' < "$file" > "$scratch"
  cp -- "$scratch" "$file"
}

# transpose matrix?
if [[ "$TRANSPOSE" == "yes" ]]; then
  transpose_file "$OUTPUT" "$TMPFILE"
fi
# Joins the arguments after $1 into one string, using $1 as the separator.
join_by() {
  local IFS=$1
  shift
  printf '%s' "$*"
}

#######################################
# Replaces a blank-separated data file with a single line that holds, for
# each column, its mean followed by its sample standard deviation
# ("mean1 dev1 mean2 dev2 ..."), both computed by bc with scale=4.
# With fewer than two rows the deviation is written as 0, because the
# sample formula divides by rows - 1.
# Arguments:
#   $1 - data file, rewritten in place
#   $2 - scratch file used while rewriting
#######################################
average_columns() {
  local file=$1 scratch=$2
  local ncols nrows col sum_expr sq_expr mean stddev line=""
  local -a values
  ncols=$(head -n1 < "$file" | wc -w)
  # grep -c '' also counts a last line that lacks its newline
  nrows=$(grep -c '' < "$file")
  # arithmetic expansion strips the padding some wc implementations emit
  ncols=$((ncols))
  nrows=$((nrows))

  for ((col = 1; col <= ncols; col++)); do
    values=()
    # read splits on whitespace without glob-expanding the values;
    # its non-zero status at end of input is expected
    read -r -d '' -a values < <(cut -d' ' -f"$col" < "$file")
    sum_expr=$(join_by + "${values[@]}")
    sq_expr=$(join_by + "${values[@]/%/^2}")

    # average
    mean=$(bc -l <<< "scale=4; ($sum_expr)/$nrows")

    # stddev
    if ((nrows > 1)); then
      stddev=$(bc -l <<< "scale=4; sqrt(($nrows * ($sq_expr) - ($sum_expr)^2) / ($nrows * ($nrows - 1)))")
    else
      stddev=0
    fi
    line+="${line:+ }$mean $stddev"
  done

  printf '%s\n' "$line" > "$scratch"
  cp -- "$scratch" "$file"
}

# average columns?
if [[ "$AVERAGE" == "yes" ]]; then
  average_columns "$OUTPUT" "$TMPFILE"
fi
#######################################
# Prefixes every non-empty line of a file with its line number and a blank,
# giving the data an x-axis column. Empty lines are dropped.
# Arguments:
#   $1 - data file, rewritten in place
#   $2 - scratch file used while rewriting
#######################################
add_x_axis() {
  local file=$1 scratch=$2
  # grep -n emits "<number>:<line>"; only that first colon is the separator,
  # so colons inside the data (e.g. 12:30) must stay untouched
  grep -n "." < "$file" | sed -e 's/:/ /' > "$scratch"
  cp -- "$scratch" "$file"
}

# add x-axis?
if [[ "$XAXIS" == "yes" ]]; then
  add_x_axis "$OUTPUT" "$TMPFILE"
fi
#######################################
# Writes the gnuplot script that plots the data file.
# The first column is the x-axis; every further column becomes one series
# ("plot" for the first, "replot" for the others). For the x11 format the
# script ends with "pause -1"; otherwise it selects the terminal and output
# file and replots into it.
# Globals (read): OUTPUT GNUPLOT GNUPLOT_OPTIONS FORMAT WIDTH HEIGHT
#   OUTPUT_PLOT LINES TITLE
# Outputs: creates or overwrites the file named by GNUPLOT
#######################################
write_gnuplot_script() {
  # Local names on purpose: assigning to TERM would change the terminal
  # type that the gnuplot child process inherits.
  local count terminal_cmd output_cmd style="" opts verb series

  # data columns
  count=$(head -n1 < "$OUTPUT" | wc -w)
  count=$((count))

  # build output/format statement
  case "$FORMAT" in
    png)
      terminal_cmd="set terminal png size $WIDTH,$HEIGHT"
      output_cmd="set output \"$OUTPUT_PLOT\""
      ;;
    ps)
      terminal_cmd="set terminal postscript"
      output_cmd="set output \"$OUTPUT_PLOT\""
      ;;
    *)
      terminal_cmd="set terminal X11"
      output_cmd="set output"
      ;;
  esac

  # 'with <style>' and 'title' are independent plot options; 'title' must
  # not be placed behind a bare 'with'
  if [[ "$LINES" == "yes" ]]; then
    style="with lines"
  fi

  {
    # init
    printf '%s\n' "# gnuplot script for '$OUTPUT'"
    if [[ -n "$GNUPLOT_OPTIONS" ]]; then
      cat -- "$GNUPLOT_OPTIONS"
    fi

    # the plots: series k uses column k+1; the first one is always written
    for ((series = 1; series == 1 || series < count; series++)); do
      opts=$style
      if [[ "$TITLE" == "yes" ]]; then
        opts+="${opts:+ }title '$series'"
      fi
      if ((series == 1)); then
        verb="plot"
      else
        verb="replot"
      fi
      printf '%s "%s" using 1:%d %s\n' "$verb" "$OUTPUT" "$((series + 1))" "$opts"
    done
    echo

    # only pause if displayed in window
    if [[ "$FORMAT" == "x11" ]]; then
      echo "pause -1"
    else
      printf '%s\n' "$terminal_cmd" "$output_cmd" "replot"
    fi
  } > "$GNUPLOT"
}

# gnuplot script?
if [[ "$HAS_GNUPLOT" == "yes" ]]; then
  write_gnuplot_script

  # run gnuplot
  if [[ "$EXECUTE" == "yes" ]]; then
    if [[ "$FORMAT" == "x11" ]]; then
      echo "Press <Return> to close window..."
    fi
    gnuplot "$GNUPLOT"
  fi
fi
#######################################
# Removes the scratch file. When no '-o' was given, also prints the
# converted data on stdout and removes the temporary data file.
# File names are quoted so that names containing blanks cannot make rm
# delete unrelated files.
# Globals (read): TMPFILE OUTPUT HAS_OUTPUT
#######################################
finish() {
  rm -f -- "$TMPFILE"
  if [[ "$HAS_OUTPUT" == "no" ]]; then
    cat -- "$OUTPUT"
    rm -f -- "$OUTPUT"
  fi
}

# clean up
finish