1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
|
# Copyright(c) 1986 Association of Universities for Research in Astronomy Inc.
include <mach.h>
# SPLIT -- Split a large file up into more manageable pieces. If the operand
# is a text file, split the file into segments of at most NLINES lines, else
# if the file is a binary file, split it into segments of at most NBYTES bytes.
# Only a single input file can be processed.
procedure t_split()
long offset
bool verbose
pointer sp, input, output, fname, buf
int maxfiles, nchars, nlines, nbytes
int file_type, nrecords, fileno, in, out, n
bool clgetb()
int open(), read(), getline(), access(), clgeti()
begin
call smark (sp)
call salloc (input, SZ_FNAME, TY_CHAR)
call salloc (output, SZ_FNAME, TY_CHAR)
call salloc (fname, SZ_FNAME, TY_CHAR)
# Get the input file name and the root name for the output files.
call clgstr ("input", Memc[input], SZ_FNAME)
call clgstr ("output", Memc[output], SZ_FNAME)
# Determine the file type of the input file.
if (access (Memc[input], READ_ONLY, TEXT_FILE) == YES)
file_type = TEXT_FILE
else
file_type = BINARY_FILE
# Determine the segment size and allocate the data buffer.
if (file_type == TEXT_FILE) {
nlines = clgeti ("nlines")
call salloc (buf, SZ_LINE, TY_CHAR)
} else {
nbytes = clgeti ("nbytes")
nchars = (nbytes + SZB_CHAR-1) / SZB_CHAR
call salloc (buf, nchars, TY_CHAR)
}
maxfiles = clgeti ("maxfiles")
verbose = clgetb ("verbose")
# Split the input file.
in = open (Memc[input], READ_ONLY, file_type)
offset = 1
for (fileno=1; fileno <= maxfiles; fileno=fileno+1) {
# Open the next segment file.
call sprintf (Memc[fname], SZ_FNAME, "%s.%0*d")
call pargstr (Memc[output])
call pargi (int (log10(real(maxfiles))) + 1)
call pargi (fileno)
if (verbose) {
call printf ("%s: ")
call pargstr (Memc[fname])
call flush (STDOUT)
}
out = open (Memc[fname], NEW_FILE, file_type)
# Copy the segment.
if (file_type == BINARY_FILE) {
n = read (in, Memc[buf], nchars)
if (n != EOF) {
call write (out, Memc[buf], n)
nrecords = n
} else
nrecords = 0
} else {
for (nrecords=0; nrecords < nlines; nrecords=nrecords+1)
if (getline (in, Memc[buf]) == EOF)
break
else
call putline (out, Memc[buf])
}
# Close the file; delete it and exit if no data was written.
call close (out)
if (nrecords <= 0) {
if (verbose)
call printf ("[deleted; exit]\n")
call delete (Memc[fname])
break
} else if (verbose) {
call printf ("%d %s @ %d\n")
if (file_type == TEXT_FILE) {
call pargi (nrecords)
call pargstr ("lines")
} else {
call pargi (nrecords * SZB_CHAR)
call pargstr ("bytes")
}
call pargi (offset)
}
offset = offset + nrecords
call flush (STDOUT)
}
call sfree (sp)
end
|