File: simple.c

package info (click to toggle)
zsv 1.3.0-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 49,168 kB
  • sloc: ansic: 175,811; cpp: 56,301; sh: 3,635; makefile: 3,049; javascript: 577; cs: 90; awk: 70; python: 41; sql: 15
file content (123 lines) | stat: -rw-r--r-- 3,375 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
#include <stdio.h>
#include <string.h>
#include <zsv.h>

/**
 * Simple example using libzsv to call a row handler after each row is parsed
 *
 * In this super simple example, we will use libzsv to parse a CSV file
 * and call our custom row handler after each row is parsed. Our row handler
 * will check each cell in the row to determine if it is blank, and output
 * the row number, the total number of cells and the number of non-blank cells
 *
 * Example:
 *   `echo 'abc,def\nghi,,,' | build/simple -`
 * Outputs:
 *   Row 1 has 2 columns of which 2 are non-blank
 *   Row 2 has 4 columns of which 1 is non-blank
 */

/**
 * State shared with our row handler: everything the handler needs in order
 * to inspect the row that was just parsed and to number its output
 */
struct my_data {
  /* parser handle, through which the handler reads the parsed cells */
  zsv_parser parser;

  /* running row counter; the handler bumps it once per row it reports */
  size_t row_num;
};

/**
 * Our row handler is passed a pointer to our structure
 */
void my_row_handler(void *ctx) {
  struct my_data *data = ctx;

  /* get a cell count */
  size_t cell_count = zsv_cell_count(data->parser);

  /* iterate through each cell in this row, to count blanks */
  size_t nonblank = 0;
  for (size_t i = 0; i < cell_count; i++) {
    /* use zsv_get_cell() to get our cell data */
    struct zsv_cell c = zsv_get_cell(data->parser, i);

    /* check if the cell data length is zero */
    if (c.len > 0)
      nonblank++;
  }

  /* print our results for this row */
  printf("Row %zu has %zu columns of which %zu %s non-blank\n", ++data->row_num, cell_count, nonblank,
         nonblank == 1 ? "is" : "are");
}

/**
 * Main routine. Our program will take a single argument (a file name, or -)
 * and output, for each row, the numbers of total and blank cells
 */
int main(int argc, const char *argv[]) {

  /**
   * Process our arguments; output usage and/or errors if appropriate
   */
  if (argc != 2) {
    fprintf(stderr, "Reads a CSV file or stdin, and for each row,\n"
                    " output counts of total and blank cells\n");
    fprintf(stderr, "Usage: simple <filename or dash(-) for stdin>\n");
    fprintf(stderr,
            "Example:\n"
            "  echo \"A1,B1,C1\\nA2,B2,\\nA3,,C3\\n,,C3\" | %s -\n\n",
            argv[0]);
    return 0;
  }

  FILE *f = strcmp(argv[1], "-") ? fopen(argv[1], "rb") : stdin;
  if (!f) {
    perror(argv[1]);
    return 1;
  }

  /**
   * Configure our parser options. Here, all we do is specify our row handler
   * and the pointer that will be passed to our row handler. There are many
   * other options to control the parser behavior (CSV vs TSV vs other
   * delimited; header row span etc)-- for details, see
   * ../../include/zsv/api.h
   */
  struct zsv_opts opts = {0};
  opts.row_handler = my_row_handler;
  struct my_data data = {0};
  opts.ctx = &data;
  opts.stream = f;

  /**
   * Create a parser
   */
  data.parser = zsv_new(&opts);

  /**
   * Continuously parse our input until we have no more input
   */
  enum zsv_status stat;
  while ((stat = zsv_parse_more(data.parser)) == zsv_status_ok)
    ;

  /**
   * Clean up
   */
  zsv_finish(data.parser);
  zsv_delete(data.parser);

  if (f != stdin)
    fclose(f);

  /**
   * If there was a parse error, print it
   */
  if (stat != zsv_status_no_more_input) {
    fprintf(stderr, "Parse error: %s\n", zsv_parse_status_desc(stat));
    return 1;
  }

  return 0;
}