编译原理预测分析表自顶向下的语法分析实现

递归下降

递归子程序方法的思路：递归子程序法是一种确定的自顶向下语法分析方法，要求文法是LL(1)文法。它的实现思想是对应文法中每个非终结符编写一个递归过程，每个过程的功能是识别由该非终结符推出的串，当某非终结符的产生式有多个候选式时能够按LL(1)形式唯一地确定选择某个候选式进行推导。

具体请看：

递归下降实现LL(1)文法分析C语言与Python实现

预测分析表

预测分析方法的思路：预测分析法是一种表驱动的方法，它由下推栈，预测分析表和控制程序组成。实际上是一种下推自动机的实现模型。预测分析法的关键为预测分析表的构建，即文法中各非终结符first集和follow集的求得。预测分析法从开始符号开始，根据当前句型的最左边的非终结符和分析串中的当前符号，查预测分析表确定下一步推导所要选择的产生式，最终得到输入串的最左推导，完成输入串的语法检查。

流程图

Python代码

import time
import wx
import wx.grid

FIRST = dict()  # FIRST集
FOLLOW = dict()  # FOLLOW集
Grammar = dict()  # 文法
LL1Table = dict()  # 分析表
VT = set()  # 终结符
ProcessList = dict()


def get_lan():
    num = int(input('请输入文法的个数：'))
    for i in range(num):
        temp = input()
        splitlist = temp[3:].replace("\n", "").split("|")
        Grammar[temp[0]] = splitlist


def get_first():
    for k in Grammar:
        l = Grammar[k]
        FIRST[k] = list()
        for s in l:
            if not (s[0].isupper()):
                FIRST[k].append(s[0])
    for i in range(2):
        for k in Grammar:
            l = Grammar[k]
            for s in l:
                if (s[0].isupper()):
                    FIRST[k].extend(FIRST[s[0]])
                    FIRST[k] = list(set(FIRST[k]))  # 去重
    print("文法为：%s" % Grammar)
    print("FIRST集为：%s" % FIRST)


def get_follow():
    condition = lambda t: t != '~'  # 过滤器用于过滤空串
    for k in Grammar:  # 新建list
        FOLLOW[k] = list()
        if k == list(Grammar.keys())[0]:
            FOLLOW[k].append('#')
    for i in range(2):
        for k in Grammar:
            l = Grammar[k]
            for s in l:
                if s[len(s) - 1].isupper():
                    FOLLOW[s[len(s) - 1]].extend(FOLLOW[k])  # 若A→αB是一个产生式，则把FOLLOW(A)加至FOLLOW(B)中
                    FOLLOW[s[len(s) - 1]] = list(filter(condition, FOLLOW[s[len(s) - 1]]))  # 去除空串
                for index in range(len(s) - 1):
                    if s[index].isupper():
                        if s[index + 1].isupper():  # 若A→αBβ是一个产生式，则把FIRST(β)\{ε}加至FOLLOW(B)中；
                            FOLLOW[s[index]].extend(FIRST[s[index + 1]])
                            FOLLOW[s[index]] = list(filter(condition, FOLLOW[s[index]]))  # 去除空串
                        if not (s[index + 1].isupper()) and (s[index + 1] != '~'):
                            FOLLOW[s[index]].append(s[index + 1])
                        emptyflag = 1
                        for i in range(index + 1, len(s)):
                            if not (s[i].isupper()) or (s[i].isupper() & ('~' not in FIRST[s[i]])):
                                emptyflag = 0
                                break
                        if emptyflag == 1:
                            FOLLOW[s[index]].extend(FOLLOW[k])  # A→αBβ是一个产生式而(即ε属于FIRST(β))，则把FOLLOW(A)加至FOLLOW(B)中
                            FOLLOW[s[index]] = list(filter(condition, FOLLOW[s[index]]))  # 去除空串
    for k in FOLLOW:  # 去重
        FOLLOW[k] = list(set(FOLLOW[k]))
    print('FOLLOW集为：%s' % FOLLOW)


def get_VT():
    VT.add('#')
    for l in Grammar.values():
        for s in l:
            for c in s:
                if not (c.isupper()) and (c != '~'): VT.add(c)
    print('终结符为：%s' % VT)


def generate_table():
    get_VT()
    for k in Grammar:  # 初始化分析表
        LL1Table[k] = dict()
        for e in VT:
            LL1Table[k][e] = None
    for k in Grammar:
        l = Grammar[k]
        for s in l:
            if s[0].isupper():
                for e in VT:
                    if e in FIRST[s[0]]: LL1Table[k][e] = s
            if s[0] in VT:
                LL1Table[k][s[0]] = s
            if (s[0].isupper() and ('~' in FIRST[s[0]])) or (s == '~'):
                for c in FOLLOW[k]:
                    LL1Table[k][c] = s
    print('分析表为：%s' % LL1Table)


class GridFrame(wx.Frame):
    def __init__(self, parent):
        global LR0TABLE

        wx.Frame.__init__(self, parent)

        # Create a wxGrid object
        grid = wx.grid.Grid(self, -1)

        # Then we call CreateGrid to set the dimensions of the grid
        # (100 rows and 10 columns in this example)
        grid.CreateGrid(len(list(LL1Table)) + 1, len(VT) + 1)

        # We can set the sizes of individual rows and columns
        # in pixels

        grid.SetCellValue(1, 0, 'E')
        grid.SetCellValue(2, 0, 'M')
        grid.SetCellValue(3, 0, 'T')
        grid.SetCellValue(4, 0, 'N')
        grid.SetCellValue(5, 0, 'F')

        VTList = list(VT)
        VTList.sort(reverse=True)
        for i in range(len(list(VT))):
            grid.SetCellValue(0, i+1, list(VTList)[i])

        for i in range(len(list(LL1Table))):
            for j in range(len(list(VT))):
                if str(LL1Table[grid.GetCellValue(i + 1, 0)][grid.GetCellValue(0, j + 1)]) != 'None':
                    grid.SetCellValue(i + 1, j + 1, '->' + str(LL1Table[grid.GetCellValue(i + 1, 0)][grid.GetCellValue(0, j + 1)]))

        print(LL1Table[grid.GetCellValue(1, 0)][grid.GetCellValue(0, 1)])

        self.Show()




##############句子的分析###############

def analyze():
    temp = input('输入句子')
    global a
    inputstr = '#'+temp+'#'
    inputstr = inputstr[1:]
    inputstr = list(inputstr[::-1])
    print(inputstr)
    process = list()
    process.append('#')  # "#"入栈
    process.append(list(Grammar.keys())[0])  # 开始符入栈
    errorflag = 0  # 出错标识
    count = 0  # 插入列表时的索引
    ProcessList.clear()
    ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'init')
    while True:
        count += 1
        current = process.pop()
        if current == inputstr[-1] == '#':  # 分析成功结束
            ProcessList[count] = ('句子', '接受', '', '')
            break

        if current in VT and (current == inputstr[-1]):  # 遇到终结符
            inputstr.pop()
            ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', '读取下一个')
            continue

        if inputstr[-1] in VT:  # 判断是不是终结符
            new = LL1Table[current][inputstr[-1]]
        else:
            errorflag = 1
            ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'Error:输入不合法！')
            break

        if new == None:  # 没有找到对应产生式
            errorflag = 1
            ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'Error:没有找到对应产生式!')
            break

        if new == '~':  # 产生式为空串
            ProcessList[count] = (''.join(process), ''.join(inputstr), current + '->~', '出栈')
            continue

        for c in reversed(new):  # 将产生式入栈
            process.append(c)
        ProcessList[count] = (''.join(process), ''.join(inputstr), current + '->' + ''.join(new), '出栈、入栈')

    if errorflag == 0:
        print("分析成功！")
    else:
        print("分析失败！")

    items = list(ProcessList.items())
    for i in range(len(items)):
        print(items[i][0],end='  ')
        for j in range(len(items[i][1])):
            print(items[i][1][j], end='  ')
        print(' ')
    # print(items)


def analyze2():
    temp = '(i+i)*i+i*i+i*(i+i)*i*i'
    global a
    inputstr = '#'+temp+'#'
    inputstr = inputstr[1:]
    inputstr = list(inputstr[::-1])
    process = list()
    process.append('#')  # "#"入栈
    process.append(list(Grammar.keys())[0])  # 开始符入栈
    count = 0  # 插入列表时的索引
    while True:
        count += 1
        current = process.pop()
        if current == inputstr[-1] == '#':  # 分析成功结束
            break

        if (current in VT) and (current == inputstr[-1]):  # 遇到终结符
            inputstr.pop()
            continue

        if inputstr[-1] in VT:  # 判断是不是终结符
            new = LL1Table[current][inputstr[-1]]
        else:
            break

        if new == None:  # 没有找到对应产生式
            break

        if new == '~':  # 产生式为空串
            continue

        for c in reversed(new):  # 将产生式入栈
            process.append(c)


get_lan()  # 得到文法
get_first()  # 得到FIRST集
get_follow()  # 得到FOLLOW集s
generate_table()  # 得到分析表

# GUI
app = wx.App(0)
frame = GridFrame(None)
app.MainLoop()


x = 100000
a = time.clock()
print('start')
while x:
    analyze2()  # 对输入字符串进行分析
    x -= 1
b = time.clock()
print(b-a)


'''
E->TM
M->+TM|~
T->FN
N->*FN|~
F->i|(E)
'''

'''
(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)+(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)*(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)
'''

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

import time

import wx

import wx.grid

FIRST = dict() # FIRST集

FOLLOW = dict() # FOLLOW集

Grammar = dict() # 文法

LL1Table = dict() # 分析表

VT = set() # 终结符

ProcessList = dict()

def get_lan():

num = int(input('请输入文法的个数：'))

for i in range(num):

temp = input()

splitlist = temp[3:].replace("\n", "").split("|")

Grammar[temp[0]] = splitlist

def get_first():

for k in Grammar:

l = Grammar[k]

FIRST[k] = list()

for s in l:

if not (s[0].isupper()):

FIRST[k].append(s[0])

for i in range(2):

for k in Grammar:

l = Grammar[k]

for s in l:

if (s[0].isupper()):

FIRST[k].extend(FIRST[s[0]])

FIRST[k] = list(set(FIRST[k])) # 去重

print("文法为：%s" % Grammar)

print("FIRST集为：%s" % FIRST)

def get_follow():

condition = lambda t: t != '~' # 过滤器用于过滤空串

for k in Grammar: # 新建list

FOLLOW[k] = list()

if k == list(Grammar.keys())[0]:

FOLLOW[k].append('#')

for i in range(2):

for k in Grammar:

l = Grammar[k]

for s in l:

if s[len(s) - 1].isupper():

FOLLOW[s[len(s) - 1]].extend(FOLLOW[k]) # 若A→αB是一个产生式，则把FOLLOW(A)加至FOLLOW(B)中

FOLLOW[s[len(s) - 1]] = list(filter(condition, FOLLOW[s[len(s) - 1]])) # 去除空串

for index in range(len(s) - 1):

if s[index].isupper():

if s[index + 1].isupper(): # 若A→αBβ是一个产生式，则把FIRST(β)\{ε}加至FOLLOW(B)中；

FOLLOW[s[index]].extend(FIRST[s[index + 1]])

FOLLOW[s[index]] = list(filter(condition, FOLLOW[s[index]])) # 去除空串

if not (s[index + 1].isupper()) and (s[index + 1] != '~'):

FOLLOW[s[index]].append(s[index + 1])

emptyflag = 1

for i in range(index + 1, len(s)):

if not (s[i].isupper()) or (s[i].isupper() & ('~' not in FIRST[s[i]])):

emptyflag = 0

break

if emptyflag == 1:

FOLLOW[s[index]].extend(FOLLOW[k]) # A→αBβ是一个产生式而(即ε属于FIRST(β))，则把FOLLOW(A)加至FOLLOW(B)中

FOLLOW[s[index]] = list(filter(condition, FOLLOW[s[index]])) # 去除空串

for k in FOLLOW: # 去重

FOLLOW[k] = list(set(FOLLOW[k]))

print('FOLLOW集为：%s' % FOLLOW)

def get_VT():

VT.add('#')

for l in Grammar.values():

for s in l:

for c in s:

if not (c.isupper()) and (c != '~'): VT.add(c)

print('终结符为：%s' % VT)

def generate_table():

get_VT()

for k in Grammar: # 初始化分析表

LL1Table[k] = dict()

for e in VT:

LL1Table[k][e] = None

for k in Grammar:

l = Grammar[k]

for s in l:

if s[0].isupper():

for e in VT:

if e in FIRST[s[0]]: LL1Table[k][e] = s

if s[0] in VT:

LL1Table[k][s[0]] = s

if (s[0].isupper() and ('~' in FIRST[s[0]])) or (s == '~'):

for c in FOLLOW[k]:

LL1Table[k][c] = s

print('分析表为：%s' % LL1Table)

class GridFrame(wx.Frame):

def __init__(self, parent):

global LR0TABLE

wx.Frame.__init__(self, parent)

# Create a wxGrid object

grid = wx.grid.Grid(self, -1)

# Then we call CreateGrid to set the dimensions of the grid

# (100 rows and 10 columns in this example)

grid.CreateGrid(len(list(LL1Table)) + 1, len(VT) + 1)

# We can set the sizes of individual rows and columns

# in pixels

grid.SetCellValue(1, 0, 'E')

grid.SetCellValue(2, 0, 'M')

grid.SetCellValue(3, 0, 'T')

grid.SetCellValue(4, 0, 'N')

grid.SetCellValue(5, 0, 'F')

VTList = list(VT)

VTList.sort(reverse=True)

for i in range(len(list(VT))):

grid.SetCellValue(0, i+1, list(VTList)[i])

for i in range(len(list(LL1Table))):

for j in range(len(list(VT))):

if str(LL1Table[grid.GetCellValue(i + 1, 0)][grid.GetCellValue(0, j + 1)]) != 'None':

grid.SetCellValue(i + 1, j + 1, '->' + str(LL1Table[grid.GetCellValue(i + 1, 0)][grid.GetCellValue(0, j + 1)]))

print(LL1Table[grid.GetCellValue(1, 0)][grid.GetCellValue(0, 1)])

self.Show()

##############句子的分析###############

def analyze():

temp = input('输入句子')

global a

inputstr = '#'+temp+'#'

inputstr = inputstr[1:]

inputstr = list(inputstr[::-1])

print(inputstr)

process = list()

process.append('#') # "#"入栈

process.append(list(Grammar.keys())[0]) # 开始符入栈

errorflag = 0 # 出错标识

count = 0 # 插入列表时的索引

ProcessList.clear()

ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'init')

while True:

count += 1

current = process.pop()

if current == inputstr[-1] == '#': # 分析成功结束

ProcessList[count] = ('句子', '接受', '', '')

break

if current in VT and (current == inputstr[-1]): # 遇到终结符

inputstr.pop()

ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', '读取下一个')

continue

if inputstr[-1] in VT: # 判断是不是终结符

new = LL1Table[current][inputstr[-1]]

else:

errorflag = 1

ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'Error:输入不合法！')

break

if new == None: # 没有找到对应产生式

errorflag = 1

ProcessList[count] = (''.join(process), ''.join(inputstr), ' ', 'Error:没有找到对应产生式!')

break

if new == '~': # 产生式为空串

ProcessList[count] = (''.join(process), ''.join(inputstr), current + '->~', '出栈')

continue

for c in reversed(new): # 将产生式入栈

process.append(c)

ProcessList[count] = (''.join(process), ''.join(inputstr), current + '->' + ''.join(new), '出栈、入栈')

if errorflag == 0:

print("分析成功！")

else:

print("分析失败！")

items = list(ProcessList.items())

for i in range(len(items)):

print(items[i][0],end=' ')

for j in range(len(items[i][1])):

print(items[i][1][j], end=' ')

print(' ')

# print(items)

def analyze2():

temp = '(i+i)*i+i*i+i*(i+i)*i*i'

global a

inputstr = '#'+temp+'#'

inputstr = inputstr[1:]

inputstr = list(inputstr[::-1])

process = list()

process.append('#') # "#"入栈

process.append(list(Grammar.keys())[0]) # 开始符入栈

count = 0 # 插入列表时的索引

while True:

count += 1

current = process.pop()

if current == inputstr[-1] == '#': # 分析成功结束

break

if (current in VT) and (current == inputstr[-1]): # 遇到终结符

inputstr.pop()

continue

if inputstr[-1] in VT: # 判断是不是终结符

new = LL1Table[current][inputstr[-1]]

else:

break

if new == None: # 没有找到对应产生式

break

if new == '~': # 产生式为空串

continue

for c in reversed(new): # 将产生式入栈

process.append(c)

get_lan() # 得到文法

get_first() # 得到FIRST集

get_follow() # 得到FOLLOW集s

generate_table() # 得到分析表

# GUI

app = wx.App(0)

frame = GridFrame(None)

app.MainLoop()

x = 100000

a = time.clock()

print('start')

while x:

analyze2() # 对输入字符串进行分析

x -= 1

b = time.clock()

print(b-a)

'''

E->TM

M->+TM|~

T->FN

N->*FN|~

F->i|(E)

'''

(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)+(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)*(i+i)*i+i*i+i*(i+i)*i*i+i+i*i+(i*i)

'''

测试数据

E->TM
M->+TM|~
T->FN
N->*FN|~
F->i|(E)

生成的表

句子分析 i+i*i

编译原理预测分析表自顶向下的语法分析实现

递归下降

预测分析表

流程图

Python代码

测试数据

大模型AlpacaFarm分析

NLG文本评估任务或许并不需要真值或参考文本

大模型中的RepE表征工程

大模型也是一种优化器（LLM as Optimizer）

全栈开发与快速部署Demo

学术idea自动发现与生成

自回归语言模型（language model）Python实现

粉丝期待的三体电影宇宙（近四十部电影与电视剧集）

基于历史对比学习的时序知识图谱推理

泰拉瑞亚Terriaria快速部署Linux服务器

留下评论取消回复

递归下降

预测分析表

流程图

Python代码

测试数据

相关文章

留下评论取消回复