pastebin - collaborative debugging tool
rovema.kpaste.net RSS


bootimage: config cpv test parser cpvparser1.c - test code for ksh93 compound variable parsing
Posted by Anonymous on Tue 21st Nov 2023 12:19
raw | new post
modification of post by Anonymous (view diff)

  1.  
  2. /*
  3.  * MIT License
  4.  *
  5.  * Copyright (c) 2023 Roland Mainz <roland.mainz@nrubsig.org>
  6.  *
  7.  * Permission is hereby granted, free of charge, to any person obtaining a copy
  8.  * of this software and associated documentation files (the "Software"), to deal
  9.  * in the Software without restriction, including without limitation the rights
  10.  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  11.  * copies of the Software, and to permit persons to whom the Software is
  12.  * furnished to do so, subject to the following conditions:
  13.  *
  14.  * The above copyright notice and this permission notice shall be included in all
  15.  * copies or substantial portions of the Software.
  16.  *
  17.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  18.  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  19.  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  20.  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  21.  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  22.  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  23.  * SOFTWARE.
  24.  */
  25.  
  26. /*
  27.  * cpvparser1.c - simple ksh93 compound variable parsing
  28.  *
  29.  * It basically reads the output of $ print -v ... # like this:
  30.  * ---- snip ----
  31.  * $ ksh93 -c 'compound c=( va=1 vb=hello ) ; print -v c'
  32.  * (
  33.  *        va=1
  34.  *        vb=hello
  35.  * )
  36.  * ---- snip ----
  37.  *
  38.  * ToDo:
  39.  * - arrays (indexed, sparse indexed and associative)
  40.  * - multibyte characters
  41.  *
  42.  * Written by Roland Mainz <roland.mainz@nrubsig.org>
  43.  */
  44.  
  45. #include <stdlib.h>
  46. #include <stdbool.h>
  47. #include <string.h>
  48. #include <stdio.h>
  49. #include <ctype.h>
  50.  
  51. #include "cpvparser1.h"
  52.  
  53. /* private data! */
  54. typedef struct cpv_parse_context {
  55.         const char *start_string;
  56.         const char *curr_string;
  57.         size_t max_name_val_size;
  58.         unsigned long flags;
  59. } cpv_parse_context;
  60.  
  61.  
  62. void *cpv_create_parser(const char *s, unsigned long flags, ...)
  63. {
  64.         cpv_parse_context *cpc;
  65.        
  66.         cpc = calloc(1, sizeof(cpv_parse_context));
  67.         if (!cpc)
  68.                 goto fail;
  69.        
  70.         cpc->start_string = strdup(s);
  71.         if (!cpc->start_string)
  72.                 goto fail;
  73.  
  74.         cpc->curr_string = cpc->start_string;
  75.         cpc->max_name_val_size = strlen(cpc->start_string);
  76.         cpc->flags = flags;
  77.        
  78.         return (cpc);
  79.  
  80. fail:
  81.         if (cpc) {
  82.                 free((void *)cpc->start_string);
  83.                 free(cpc);
  84.         }
  85.  
  86.         return NULL;
  87. }
  88.  
  89. void cpv_free_parser(void *v_cpc)
  90. {
  91.         cpv_parse_context *cpc = (cpv_parse_context *)v_cpc;
  92.         if (cpc) {
  93.                 free((void *)cpc->start_string);
  94.                 free(cpc);
  95.         }
  96. }
  97.  
  98. int cpv_read_cpv_header(void *v_cpc)
  99. {
  100.         cpv_parse_context *cpc = (cpv_parse_context *)v_cpc;
  101.         const char *s = cpc->curr_string;
  102.  
  103. skipspaces:
  104.         while((*s != '\0') && isspace(*s))
  105.                 s++;
  106.  
  107.         /*
  108.          * skip POSIX-style '#' comments
  109.          * (allowed since this is based on POSIX sh(1) syntax)
  110.          */
  111.         if (*s == '#') {
  112.                 s++;
  113.                 /* ignore everything until the end-of-line */
  114.                 while((*s != '\0') && (*s != '\n'))
  115.                         s++;
  116.                 goto skipspaces;
  117.         }
  118.  
  119.         if (*s == '(') {
  120.                 cpc->curr_string=++s;
  121.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  122.                         (void)fprintf(stderr, "cpv_read_cpv_header: begin-of-cpv\n");
  123.                 }
  124.                 return 0;
  125.         }
  126.  
  127.         if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  128.                 (void)fprintf(stderr, "cpv_read_cpv_header: end-of-string, should not happen\n");
  129.         }
  130.         return 1;
  131. }
  132.  
  133. int cpv_parse_name_val(void *v_cpc, cpv_name_val *cpv_nv)
  134. {
  135.         cpv_parse_context *cpc = (cpv_parse_context *)v_cpc;
  136.         char namebuff[cpc->max_name_val_size+1];
  137.         char valbuff[cpc->max_name_val_size+1];
  138.  
  139.         const char *s = cpc->curr_string;
  140.  
  141.         char *n; /* pointer in |namebuff| */
  142.         char *v; /* pointer in |valbuff| */
  143.  
  144. skipspaces:
  145.         while((*s != '\0') && isspace(*s))
  146.                 s++;
  147.  
  148.         /*
  149.          * skip POSIX-style '#' comments
  150.          * (allowed since this is based on POSIX sh(1) syntax)
  151.          */
  152.         if (*s == '#') {
  153.                 s++;
  154.                 /* ignore everything until the end-of-line */
  155.                 while((*s != '\0') && (*s != '\n'))
  156.                         s++;
  157.                 goto skipspaces;
  158.         }
  159.  
  160.         if (*s == '\0') {
  161.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  162.                         (void)fprintf(stderr, "cpv_parse_name_val: "
  163.                                 "error: end-of-string, should not happen\n");
  164.                 }
  165.                 return 1;
  166.         }
  167.  
  168.         /* cpv == "( foo=bar blabla=text )"*/
  169.         if (*s == ')') {
  170.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  171.                         (void)fprintf(stderr, "cpv_parse_name_val: end-of-cpv (OK)\n");
  172.                 }
  173.                 return 1;
  174.         }
  175.  
  176. parse_varname:
  177.         /*
  178.          * start parsing variable name
  179.          */
  180.  
  181.         /* variable names MUST start with a letter! */
  182.         if (!isalpha(*s)) {
  183.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  184.                         (void)fprintf(stderr,
  185.                                 "cpv_parse_name_val: parser error, first char "
  186.                                 "in variable name not isalpha(c=%c)\n",
  187.                                 *s);
  188.                 }
  189.                 return 1;
  190.         }
  191.  
  192.         n = namebuff;
  193.         while((*s != '\0') && isalnum(*s))
  194.                 *n++ = *s++;
  195.         *n = '\0';
  196.  
  197.         /*
  198.          * skip typed member varables
  199.          * (e.g. "typeset ", "typeset -i ", "typeset -l -i2" etc.)
  200.          */
  201.         if (isspace(*s)) {
  202.                 if ((!strcmp(namebuff, "typeset")) ||
  203.                         (!strcmp(namebuff, "integer")) ||
  204.                         (!strcmp(namebuff, "float")) ||
  205.                         (!strcmp(namebuff, "compound"))) {
  206. skip_typeset_options:
  207.                         while(isspace(*s))
  208.                                 s++;
  209.                         if (*s == '-') {
  210.                                 s++;
  211.                                 while(isalnum(*s))
  212.                                         s++;
  213.                                 goto skip_typeset_options;
  214.                         }
  215.  
  216.                         goto parse_varname;
  217.                 }
  218.         }
  219.  
  220.         /* handle '=' */
  221.         if (*s != '=') {
  222.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  223.                         (void)fprintf(stderr, "cpv_parse_name_val: "
  224.                                 "parser error, expected '=', got '%c'.\n",
  225.                                 *s);
  226.                 }
  227.                 return 1;
  228.         }
  229.  
  230.         s++; /* skip '=' */
  231.  
  232.         /*
  233.          * start parsing variable value
  234.          */
  235.         bool in_doublequotes=false;
  236.         bool in_singlequotes=false;
  237.         v = valbuff;
  238. val_quotes:
  239.         if (in_singlequotes) {
  240.                 while(*s != '\0') {
  241.                         if (*s == '\'') {
  242.                                 in_singlequotes = false;
  243.                                 s++;
  244.                                 goto val_quotes;
  245.                         }
  246.  
  247.                         if ((*s == '\\') && (*(s+1) != '\0')) {
  248.                                 /*
  249.                                  * fixme: should support \ooo octals,
  250.                                  * \u[hex] unicode and \w[hex] wchar
  251.                                  */
  252.                                 s++;
  253.                         }
  254.                         *v++ = *s++;
  255.                 }
  256.         }
  257.         else if (in_doublequotes) {
  258.                 while(*s != '\0') {
  259.                         if (*s == '"') {
  260.                                 in_doublequotes = false;
  261.                                 s++;
  262.                                 goto val_quotes;
  263.                         }
  264.  
  265.                         if ((*s == '\\') && (*(s+1) != '\0')) {
  266.                                 /*
  267.                                  * fixme: should support \ooo octals,
  268.                                  * \u[hex] unicode and \w[hex] wchar
  269.                                  */
  270.                                 s++;
  271.                         }
  272.  
  273.                         *v++ = *s++;
  274.                 }
  275.         }
  276.         else
  277.         {
  278.                 while((*s != '\0') && (!isspace(*s))) {
  279.                         if (*s == '"') {
  280.                                 in_doublequotes = true;
  281.                                 s++;
  282.                                 goto val_quotes;
  283.                         }
  284.  
  285.                         if (*s == '\'') {
  286.                                 in_singlequotes = true;
  287.                                 s++;
  288.                                 goto val_quotes;
  289.                         }
  290.  
  291.                         if ((*s == '\\') && (*(s+1) != '\0')) {
  292.                                 /*
  293.                                  * fixme: should support \ooo octals,
  294.                                  * \u[hex] unicode and \w[hex] wchar
  295.                                  */
  296.                                 s++;
  297.                         }
  298.                         *v++ = *s++;
  299.                 }
  300.         }
  301.  
  302.         if (in_singlequotes) {
  303.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  304.                         (void)fprintf(stderr, "cpv_parse_name_val: "
  305.                                 "parsererror, still in single quotes "
  306.                                 "at the end\n");
  307.                 }
  308.                 return 1;
  309.         }
  310.         if (in_doublequotes) {
  311.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  312.                         (void)fprintf(stderr, "cpv_parse_name_val: "
  313.                                 "parser error, still in double quotes "
  314.                                 "at the end\n");
  315.                 }
  316.                 return 1;
  317.         }
  318.  
  319.         *v = '\0';
  320.  
  321. #if 0
  322.         (void)printf("cpv_parse_name_val: name='%s', value='%s'\n",
  323.                 namebuff, valbuff);
  324. #endif
  325.  
  326.         cpv_nv->cpv_name   = strdup(namebuff);
  327.         cpv_nv->cpv_value  = strdup(valbuff);
  328.  
  329.         if ((cpv_nv->cpv_name == NULL) || (cpv_nv->cpv_value == NULL)) {
  330.                 cpv_free_name_val_data(cpv_nv);
  331.                 if (cpc->flags & CPVFLAG_DEBUG_OUTPUT) {
  332.                         (void)fprintf(stderr, "cpv_parse_name_val: "
  333.                                 "parser error, out of memory\n");
  334.                 }
  335.                 return 2;
  336.         }
  337.  
  338.         cpc->curr_string = s;
  339.  
  340.         return 0;
  341. }
  342.  
  343. void cpv_free_name_val_data(cpv_name_val *cnv)
  344. {
  345.         if (!cnv)
  346.                 return;
  347.  
  348.         free((void *)cnv->cpv_name);
  349.         free((void *)cnv->cpv_value);
  350.         cnv->cpv_name = NULL;
  351.         cnv->cpv_value = NULL;
  352. }
  353. /*
  354.  * MIT License
  355.  *
  356.  * Copyright (c) 2023 Roland Mainz <roland.mainz@nrubsig.org>
  357.  *
  358.  * Permission is hereby granted, free of charge, to any person obtaining a copy
  359.  * of this software and associated documentation files (the "Software"), to deal
  360.  * in the Software without restriction, including without limitation the rights
  361.  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  362.  * copies of the Software, and to permit persons to whom the Software is
  363.  * furnished to do so, subject to the following conditions:
  364.  *
  365.  * The above copyright notice and this permission notice shall be included in all
  366.  * copies or substantial portions of the Software.
  367.  *
  368.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  369.  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  370.  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  371.  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  372.  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  373.  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  374.  * SOFTWARE.
  375.  */
  376.  
  377. /*
  378.  * cpvparser1.c - simple ksh93 compound variable parsing
  379.  *
  380.  * It basically reads the output of $ print -v ... # like this:
  381.  * ---- snip ----
  382.  * $ ksh93 -c 'compound c=( va=1 vb=hello ) ; print -v c'
  383.  * (
  384.  *        va=1
  385.  *        vb=hello
  386.  * )
  387.  * ---- snip ----
  388.  *
  389.  * ToDo:
  390.  * - arrays (indexed, sparse indexed and associative)
  391.  * - multibyte characters
  392.  *
  393.  * Written by Roland Mainz <roland.mainz@nrubsig.org>
  394.  */
  395.  
  396. #include <stdlib.h>
  397. #include <stdbool.h>
  398. #include <string.h>
  399. #include <stdio.h>
  400. #include <ctype.h>
  401.  
  402. #include "cpvparser1.h"
  403.  
  404. /*
  405.  * Compile with:
  406.  * $ gcc -Wall -g cpvparser1.c  main.c -o cpvparser1
  407.  *
  408.  * Example usage:
  409.  * ./cpvparser1 "$(ksh -c 'compound c ; typeset c.s="hello" ; print -v c')"
  410.  */
  411. int main(int ac, char *av[])
  412. {
  413.         const char *str =
  414.                 " ( \n"
  415.                 "x=y1 chicken=wing xchicken=w\\\"ing qcount=\"one two\" sq1='foo \" x \" bar'"
  416.                 "\n  # a comment x=y\n"
  417.                 "\n"
  418.                 " \n"
  419.                 "\t\n"
  420.                 "emptyval= \n"
  421.                 "emptyval2=\n"
  422.                 "emptyval3=''\n"
  423.                 " emptyval4="" \n"
  424.                 "aftercomment=yep\n"
  425.                 "typeset -i2 bintypedvar=1010\n"
  426.                 "typeset  -u  strtypedvar=UAUA\n"
  427.                 "integer lastvar=666 \n"
  428.                 "\n)";
  429.         int numcnv = 0;
  430.         int i = 0;
  431.         cpv_name_val cnv[256];
  432.         void *c;
  433.  
  434.         if (ac == 2) {
  435.                 (void)fputs("# parsing av[1] ...\n", stderr);
  436.                 c = cpv_create_parser(av[1], 0);
  437.         }
  438.         else {
  439.                 (void)fputs("# parsing builtin test string ...\n", stderr);
  440.                 c = cpv_create_parser(str, 0);
  441.         }
  442.  
  443.         if (!c) {
  444.                 (void)fprintf(stderr, "cpv_create_parser: no memory\n");
  445.                 return EXIT_FAILURE;
  446.         }
  447.  
  448.         if (cpv_read_cpv_header(c)) {
  449.                 (void)fprintf(stderr, "cpv_read_cpv_header failed\n");
  450.                 return EXIT_FAILURE;
  451.         }
  452.  
  453.         for (numcnv=0 ; cpv_parse_name_val(c, &cnv[numcnv]) == 0 ; numcnv++) {
  454.         }
  455.  
  456.         (void)fputs("# data:\n", stderr);
  457.         for (i=0 ; i < numcnv ; i++) {
  458.                 (void)printf("name='%s', value='%s'\n", cnv[i].cpv_name, cnv[i].cpv_value);
  459.         }
  460.  
  461.         (void)fputs("# free memory ...\n", stderr);
  462.         for (i=0 ; i < numcnv ; i++) {
  463.                 cpv_free_name_val_data(&cnv[i]);
  464.         }
  465.        
  466.         cpv_free_parser(c);
  467.  
  468.         (void)fputs("# done.\n", stderr);
  469.  
  470.         return EXIT_SUCCESS;
  471. }
  472.  
  473. /*
  474.  * MIT License
  475.  *
  476.  * Copyright (c) 2023 Roland Mainz <roland.mainz@nrubsig.org>
  477.  *
  478.  * Permission is hereby granted, free of charge, to any person obtaining a copy
  479.  * of this software and associated documentation files (the "Software"), to deal
  480.  * in the Software without restriction, including without limitation the rights
  481.  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  482.  * copies of the Software, and to permit persons to whom the Software is
  483.  * furnished to do so, subject to the following conditions:
  484.  *
  485.  * The above copyright notice and this permission notice shall be included in all
  486.  * copies or substantial portions of the Software.
  487.  *
  488.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  489.  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  490.  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  491.  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  492.  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  493.  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  494.  * SOFTWARE.
  495.  */
  496.  
  497. /*
  498.  * cpvparser1.h - simple ksh93 compound variable parsing
  499.  *
  500.  * It basically reads the output of $ print -v ... # like this:
  501.  * ---- snip ----
  502.  * $ ksh93 -c 'compound c=( va=1 vb=hello ) ; print -v c'
  503.  * (
  504.  *        va=1
  505.  *        vb=hello
  506.  * )
  507.  * ---- snip ----
  508.  *
  509.  * ToDo:
  510.  * - arrays (indexed, sparse indexed and associative)
  511.  * - multibyte characters
  512.  *
  513.  * Written by Roland Mainz <roland.mainz@nrubsig.org>
  514.  */
  515.  
  516. #ifndef CPV_PARSER_H
  517. #define CPV_PARSER_H 1
  518.  
  519. typedef struct cpv_name_val
  520. {
  521.         const char *cpv_name;
  522.         const char *cpv_value;
  523. } cpv_name_val;
  524.  
  525. /* Flags for |cpv_create_parser()| */
  526. #define CPVFLAG_DEBUG_OUTPUT (0x00000008L)
  527.  
  528. /* prototypes */
  529. void *cpv_create_parser(const char *s, unsigned long flags, ...);
  530. void cpv_free_parser(void *);
  531. int cpv_read_cpv_header(void *);
  532. void cpv_free_name_val_data(cpv_name_val *);
  533. int cpv_parse_name_val(void *, cpv_name_val *);
  534.  
  535. #endif /* !CPV_PARSER_H */

Submit a correction or amendment below (click here to make a fresh posting)
After submitting an amendment, you'll be able to view the differences between the old and new posts easily.

Syntax highlighting:

To highlight particular lines, prefix each line with {%HIGHLIGHT}




All content is user-submitted.
The administrators of this site (kpaste.net) are not responsible for their content.
Abuse reports should be emailed to us at