Chitrank-Dixit · October 7, 2022 16:40
diff --git a/lexical_analyser.py b/lexical_analyser.py
 # The Following Program would work as Lexical Analyser
 #
 # Write a C/C++ program which reads a program written
 # in any programming language (say C/C++/Java) and then perform 
 # lexical analysis. The output of program should contain the 
 # tokens i.e. classification as identifier, special symbol, delimiter, 
 # operator, keyword or string. It should also display the number of 
 # identifiers, special symbol, delimiter, operator, keyword, strings 
 # and statements

 ##############################################
 #  Input C Program
 ##############################################
 ##############################################
 # // Made for Lexical Analysis
 # /* Program as Input for LabAssignent3 */
 # /**/
 # #include <stdio.h> // This is a header file
 # int main()
 # {
 #     int a;
 #     a = 10;
 #     printf("The value of a is %d ",a);
 #     return 0;
 # }
 ##############################################







 import re

 f = open('InputProg.c','r')

 operators = { '=': 'Assignment Operator','+': 'Additon Operator', '-' : 'Substraction Operator', '/' : 'Division Operator', '*': 'Multiplication Operator', '++' : 'increment Operator', '--' : 'Decrement Operator'}
 optr_keys = operators.keys()

 comments = {r'//' : 'Single Line Comment',r'/*' : 'Multiline Comment Start', r'*/' : 'Multiline Comment End', '/**/' : 'Empty Multiline comment'}
 comment_keys = comments.keys()

 header = {'.h': 'header file'}
 header_keys = header.keys()

 sp_header_files = {'<stdio.h>':'Standard Input Output Header','<string.h>':'String Manipulation Library'}

 macros = {r'#\w+' : 'macro'}
 macros_keys = macros.keys()

 datatype = {'int': 'Integer','float' : 'Floating Point', 'char': 'Character','long': 'long int'}
 datatype_keys = datatype.keys()

 keyword = {'return' : 'keyword that returns a value from a block'}
 keyword_keys = keyword.keys()

 delimiter = {';':'terminator symbol semicolon (;)'}
 delimiter_keys = delimiter.keys()

 blocks = {'{' : 'Blocked Statement Body Open', '}':'Blocked Statement Body Closed'}
 block_keys = blocks.keys()

 builtin_functions = {'printf':'printf prints its argument on the console'}

 non_identifiers = ['_','-','+','/','*','`','~','!','@','#','$','%','^','&','*','(',')','=','|','"',':',';','{'
 ,'}','[',']','<','>','?','/']

 numerals = ['0','1','2','3','4','5','6','7','8','9','10']

 # Flags
 dataFlag = False


 i = f.read()

 count = 0
 program =  i.split('\n')

 for line in program:
    count = count+1
    print "Line #",count,"\n",line
    
     
    tokens = line.split(' ')
    print "Tokens are",tokens
    print "Line #",count,'properties \n'
    for token in tokens:
        
        if '\r' in token:
            position = token.find('\r')
            token=token[:position]
        # print 1
        
        if token in block_keys:
            print blocks[token]
        if token in optr_keys:
            print "Operator is: ", operators[token]
        if token in comment_keys:
            print "Comment Type: ", comments[token]
        if token in macros_keys:
            print "Macro is: ", macros[token]
        if '.h' in token:
            print "Header File is: ",token, sp_header_files[token]
        if '()' in token:
            print "Function named", token
        
        if dataFlag == True and (token not in non_identifiers) and ('()' not in token):
            print "Identifier: ",token
        if token in datatype_keys:
            print "type is: ", datatype[token]
            dataFlag = True
        
        if token in keyword_keys:
            print keyword[token]
            
        if token in delimiter:
            print "Delimiter" , delimiter[token]
        if '#' in token:
            match = re.search(r'#\w+', token)
            print "Header", match.group()
        if token in numerals:
            print token,type(int(token))
            
    dataFlag = False   
            
    
    print "________________________"
    

 f.close()
	# The Following Program would work as Lexical Analyser
	#
	# Write a C/C++ program which reads a program written
	# in any programming language (say C/C++/Java) and then perform
	# lexical analysis. The output of program should contain the
	# tokens i.e. classification as identifier, special symbol, delimiter,
	# operator, keyword or string. It should also display the number of
	# identifiers, special symbol, delimiter, operator, keyword, strings
	# and statements

	##############################################
	# Input C Program
	##############################################
	##############################################
	# // Made for Lexical Analysis
	# /* Program as Input for LabAssignent3 */
	# /**/
	# #include <stdio.h> // This is a header file
	# int main()
	# {
	# int a;
	# a = 10;
	# printf("The value of a is %d ",a);
	# return 0;
	# }
	##############################################







	import re

	f = open('InputProg.c','r')

	operators = { '=': 'Assignment Operator','+': 'Additon Operator', '-' : 'Substraction Operator', '/' : 'Division Operator', '*': 'Multiplication Operator', '++' : 'increment Operator', '--' : 'Decrement Operator'}
	optr_keys = operators.keys()

	comments = {r'//' : 'Single Line Comment',r'/' : 'Multiline Comment Start', r'/' : 'Multiline Comment End', '/**/' : 'Empty Multiline comment'}
	comment_keys = comments.keys()

	header = {'.h': 'header file'}
	header_keys = header.keys()

	sp_header_files = {'<stdio.h>':'Standard Input Output Header','<string.h>':'String Manipulation Library'}

	macros = {r'#\w+' : 'macro'}
	macros_keys = macros.keys()

	datatype = {'int': 'Integer','float' : 'Floating Point', 'char': 'Character','long': 'long int'}
	datatype_keys = datatype.keys()

	keyword = {'return' : 'keyword that returns a value from a block'}
	keyword_keys = keyword.keys()

	delimiter = {';':'terminator symbol semicolon (;)'}
	delimiter_keys = delimiter.keys()

	blocks = {'{' : 'Blocked Statement Body Open', '}':'Blocked Statement Body Closed'}
	block_keys = blocks.keys()

	builtin_functions = {'printf':'printf prints its argument on the console'}

	non_identifiers = ['_','-','+','/','','`','~','!','@','#','$','%','^','&','','(',')','=','\|','"',':',';','{'
	,'}','[',']','<','>','?','/']

	numerals = ['0','1','2','3','4','5','6','7','8','9','10']

	# Flags
	dataFlag = False


	i = f.read()

	count = 0
	program = i.split('\n')

	for line in program:
	count = count+1
	print "Line #",count,"\n",line


	tokens = line.split(' ')
	print "Tokens are",tokens
	print "Line #",count,'properties \n'
	for token in tokens:

	if '\r' in token:
	position = token.find('\r')
	token=token[:position]
	# print 1

	if token in block_keys:
	print blocks[token]
	if token in optr_keys:
	print "Operator is: ", operators[token]
	if token in comment_keys:
	print "Comment Type: ", comments[token]
	if token in macros_keys:
	print "Macro is: ", macros[token]
	if '.h' in token:
	print "Header File is: ",token, sp_header_files[token]
	if '()' in token:
	print "Function named", token

	if dataFlag == True and (token not in non_identifiers) and ('()' not in token):
	print "Identifier: ",token
	if token in datatype_keys:
	print "type is: ", datatype[token]
	dataFlag = True

	if token in keyword_keys:
	print keyword[token]

	if token in delimiter:
	print "Delimiter" , delimiter[token]
	if '#' in token:
	match = re.search(r'#\w+', token)
	print "Header", match.group()
	if token in numerals:
	print token,type(int(token))

	dataFlag = False


	print "________________________"


	f.close()