a. Have a scenario, where in my function reads in a file which contains list of c-structures as shown below, reads the file and extracts all the information between { } braces for each structure and store them in arrays.
package whatstruct;typedef struct packed {int [4:0] version;char party;float parity; char ccc; int [7:0] spend;} party_s;typedef struct packed {int [5:0] cod3;int [1:0] group;int [51:0] duty;char calloff; char selfi;int [11:0] snap; int [5:0] longtrip;int [1:0] whattodo;int [9:0] sky;int [7:0] yahoo;int [5:0] hurrey;int [3:0] appology;int [1:0] temp;int [2:0] iddd; float dontknow; } dict_s;typedef struct packed {int [4:0] jan;int [12:0] feb;int [1:0] mar;logic mar; logic april; } months_c;typedef struct packed {var apple;int mango;float banana;int lichi} fruits_s;
endpackage: whatstruct
b. The functions reads in two parameters, one is the file containing the structures and the second parameter contains list of struct names only from which the lines needs to be extracted. For extracting all the infos between {}, tried some of the examples available as given below.
from Tkinter import *
import subprocess
import shlex
import os
import time
import string
import threading
import sys, argparse
import ttk
import re
import logging
import warnings
import os.path
import gzipreadstructfile = None
filename = None
structnames = Nonedef readfileanddump(filename, structnames):readstructfile = open(filename, "r+")test_str = readstructfile.readlines() matches = re.finditer(r"\{(.*?)\}", str(test_str), re.MULTILINE | re.DOTALL)for matchNum, match in enumerate(matches):for groupNum in range(0, len(match.groups())):print (match.group(1))# for lines in readstructfile:# print linesreadfileanddump("structpkg.c", all);
c. Was able to extract all the infos between {} and dumpout the infos if the second parameter is provided as "all". But if the second parameter passed is a string containing struct names, only those struct that needs to be extracted. I am unclear how to do that. Is it possible using regexp ? or any other way is better?
Any suggestion is highly helpful !
Updated CODE:
from Tkinter import *
import subprocess
import shlex
import os
import time
import string
import threading
import sys, argparse
import ttk
from openpyxl import Workbook, load_workbook
from openpyxl.compat import range
from openpyxl.utils import get_column_letter
from openpyxl.styles import Alignment, PatternFill, Border, Color
from openpyxl.styles.colors import YELLOW
from openpyxl.styles.borders import Border, Side
import re
import logging
import warnings
import os.path
import gzip#import xlwt
#import xlrd readstructfile = None
filename = None
structnames = []
filename_and_structnames_l = []
global found_struct
global found_struct_idxfound_struct_idx = {}
found_struct = 0def readfileanddump(filename_and_structnames):global found_structfilename_and_structnames_l = filename_and_structnames.split(",") if len(filename_and_structnames_l) < 2:filename = filename_and_structnames_l[0]structnames.append('all')print "1. Value of filename %s and structnames %s"%(filename, str(structnames))elif len(filename_and_structnames_l) > 1 and len(filename_and_structnames_l) < 3:filename = filename_and_structnames_l[0]structnames.append(filename_and_structnames_l[1])print "2. Value of filename %s and structnames %s"%(filename, str(structnames))elif len(filename_and_structnames_l) > 2: filename = filename_and_structnames_l[0]for i in range (1, len(filename_and_structnames_l)):structnames.append(filename_and_structnames_l[i])print "3. Value of filename %s and structnames %s"%(filename, str(structnames))if (len(structnames) == 1) and (structnames[0] == 'all'):readstructfile = open(filename, "r+")test_str = readstructfile.readlines() matches = re.finditer(r"\{(.*?)\}", str(test_str), re.MULTILINE | re.DOTALL)for matchNum, match in enumerate(matches):for groupNum in range(0, len(match.groups())):print (match.group(1))# match_group_t = str(str(re.sub('[A-Za-z0-9_[]:]+', '', str(match.group(1)))).strip())# match_group_t = match.groups(1)#for i in range (len(match_group_t)):# print match_group_t[i].replace("\n","")# print str(str(re.sub('[^A-Za-z0-9[:]]+[\r\n]+', ' ', str(match_group_t[i]))))# print re.sub(r"(?<=[a-z])\r?\n"," ", match_group_t[i]) # print ''.join(ch for ch in match_group_t[i] if not ch.isspace())# print ''.join(match_group_t[i].strip().split())#print(re.sub(r"(?:[;\n']|\s{2,})",r'',match_group_t[i])[2:])# print match_group_tprint(re.sub(r"(?:[;\n']|\s{2,})",r'',match.group(1))[2:])else:readstructfile = open(filename, "r+")for lines in readstructfile:if found_struct == 0 and re.match(r'.*typedef struct', lines):found_struct = 1matches = re.finditer(r"\{(.*?)\}.*", str(lines), re.MULTILINE | re.DOTALL)print "Value in matches", matchesif found_struct == 1 and re.match(r'.*}.*', lines):found_struct = 0found_struct_t = str(str(re.sub('[^A-Za-z0-9_]+', ' ', str(lines))).strip()).split(" ")for i in range (len(structnames)):if structnames[i] == found_struct_t[0]:# print "value of found_struct_t", found_struct_t# #found_struct_idx.append(found_struct_t[0]) # found_struct_idx[structnames[i]] = i # print "Value of found_struct_idx", found_struct_idx# breakprint "Value in found_struct_t", found_struct_t # for matchNum, match in enumerate(matches):# for groupNum in range(0, len(match.groups())):# print (match.group(1))readfileanddump('alldetailspkg');