基于trie树的具有联想功能的文本编辑器
之前的软件设计与开发实践课程中,自己构思的大作业题目。做的具有核心功能,但是还欠缺边边角角的小功能和持久化数据结构,先放出来,有机会一点点改。github:https://github.com/chuxiuhong/smarteditor
数据结构,使用过程截图以及源代码如下:

#数据结构
**trie树**
trie树相应的介绍点击链接 https://en.wikipedia.org/wiki/Trie
trie树在python文件中的类型定义
Node定义
#GUI设计界面
首先,用较大的文本文件进行训练,完成trie的树的训练。本文件夹下提供了一个big2.txt文件作为示例。

在之后的输入会弹出提示框
#!/usr/bin/python
# -*- coding: utf-8 -*-
import PyQt4
from PyQt4.QtCore import *
from PyQt4.QtGui import *
import PyQt4.QtCore
import sys
import pickle print '===================start=======================' class Node:
def __init__(self):
self.value = None
self.children = {} # children is of type {char, Node}
self.fre = 0
self.father = None def CMP(a, b):
return b.fre - a.fre class Trie:
def __init__(self):
self.root = Node()
self.choose = []
self.__OpenCorrect__ = 0 def insert(self, key): # key is of type string
# key should be a low-case string, this must be checked here!
node = self.root
for char in key:
if char not in node.children:
child = Node()
node.children[char] = child
child.value = char
child.father = node
node = child
else:
node = node.children[char]
# node.value = key
node.fre += 1 def search(self, key):
node = self.root
for char in key:
if char not in node.children:
return None
else:
node = node.children[char]
return node.value def display_node(self, node):
if (node.value != None):
print node.value
for char in 'abcdefghijklmnopqrstuvwxyz':
if char in node.children:
self.display_node(node.children[char])
return def fallback(self, node):
f_char = ''
while node != self.root:
f_char = node.value + f_char
node = node.father
# print f_char
return f_char def display(self):
self.display_node(self.root) def find_node(self, string):
res_node = self.root
for i in string:
res_node = res_node.children[i]
return res_node def association(self, node):
# 调用此函数前应该先将self.choose恢复成空列表
if (node.value != None):
if node.fre > 0:
self.choose.append(node)
for char in 'abcdefghijklmnopqrstuvwxyz':
if char in node.children:
self.association(node.children[char]) def output_association(self, char):
char = str(char).lower()
self.choose = []
result_list = []
self.association(self.find_node(char))
self.choose.sort(cmp=CMP)
if len(self.choose) > 0:
for i in self.choose:
result_list.append(self.fallback(i))
if self.__OpenCorrect__ == 0:
result_list.insert(1, self.correct(char))
# print 'result_list',result_list
return result_list def correct(self, string):
self.choose = []
p = self.find_node(string[:-1])
self.association(p)
self.choose.sort(cmp=CMP)
if len(self.choose) > 1:
return self.fallback(self.choose[0]) def train(trie, path):
# f = open(r'big2.txt')
f = open(path)
word = f.read()
f.close()
word = word.split(' ')
for i in word:
trie.insert(i) trie = Trie()
trie.__OpenCorrect__ = 0 def save_model(T):
f1 = open("trie.pkl", 'wb')
pickle.dump(T, f1)
f1.close() def load_model(path):
f2 = open(path, 'rb')
trie = pickle.load(f2)
f2.close() print '================= END =====================' class UI(QDialog):
def __init__(self, parent=None):
super(UI, self).__init__(parent)
QSList = QStringList()
# default
# QSList<<'One'<<'Tow'<<'Three'<<'Four'<<'Five'
# instance of Completer class
cmp = Completer(QSList)
global edit
edit = TextEdit()
edit.setFontPointSize(80)
edit.setCompleter(cmp)
self.setWindowTitle(u"智能文本编辑器")
button1 = QPushButton(u"训练模型")
button2 = QPushButton(u"保存文本文件")
button3 = QPushButton(u"打开文本文件")
'''
buttons = QushButton()
'''
'''
定义按钮,()内为按钮名称
'''
self.connect(button1, SIGNAL("clicked()"), self.get_file)
self.connect(button2, SIGNAL("clicked()"), self.func2)
self.connect(button3, SIGNAL("clicked()"), self.func3)
'''
关联按钮与函数格式同上,触发为clicked()单击,最后一个参数为
类内函数
'''
layout = QGridLayout()
layout.addWidget(edit, 0, 1, 1, 5)
layout.addWidget(button1, 2, 1)
layout.addWidget(button2, 2, 3)
layout.addWidget(button3, 2, 5)
'''
按钮布局
'''
self.setLayout(layout)
self.center() def center(self):
screen = QDesktopWidget().screenGeometry()
size = self.geometry()
self.move((screen.width() - size.width()) / 2, (screen.height() - size.height()) / 2) def get_file(self):
s = QFileDialog.getOpenFileName(self, "Open file dialog", "/", "TXT Files(*.txt)")
train(trie, s) def func2(self):
s = QFileDialog.getSaveFileName(self, "文件保存", "C:/", "All Files (*);Text Files (*.txt)")
f = open(s, 'w')
f.write(edit.toPlainText())
f.close() def func3(self):
s = QFileDialog.getOpenFileName(self, "Open file dialog", "/", "TXT Files(*.txt)")
f = open(s)
edit.setText(PyQt4.QtCore.QString(f.read()))
f.close() class TextEdit(QTextEdit):
def __init__(self, parent=None):
super(TextEdit, self).__init__(parent)
self.cmp = None
self.p = ''
self.count = 0 def setCompleter(self, completer):
if self.cmp:
self.disconnect(self.cmp, 0, 0)
self.cmp = completer
if (not self.cmp):
return
self.cmp.setWidget(self)
self.cmp.setCompletionMode(QCompleter.PopupCompletion)
self.cmp.setCaseSensitivity(Qt.CaseInsensitive)
self.connect(self.cmp, SIGNAL('activated(QString)'), self.insertCompletion) def completer(self):
return self.cmp def insertCompletion(self, string): # get cursor position
tc = self.textCursor()
# selectd ranges
tc.movePosition(QTextCursor.StartOfWord, QTextCursor.KeepAnchor) # replace selected ranges
tc.insertText(string)
self.p += str(string)
# set cursor pos back to original pos
self.setTextCursor(tc) def textUnderCursor(self):
tc = self.textCursor()
tc.select(QTextCursor.WordUnderCursor)
return tc.selectedText() def keyPressEvent(self, e):
'''
if e.key() != Qt.Key_Backspace:
self.p = self.p + e.text()
self.count+=1
print 'yes'
else:
self.p = self.p[:-1]
self.count-=1
'''
print 'p ', self.p
print 'pressed >> ', e.text()
if (self.cmp and self.cmp.popup().isVisible()):
if e.key() in (Qt.Key_Enter, Qt.Key_Return, Qt.Key_Escape, Qt.Key_Tab, Qt.Key_Backtab):
e.ignore()
return isShortcut = ((e.modifiers() & Qt.ControlModifier) and e.key() == Qt.Key_E)
if (not self.cmp or not isShortcut):
super(TextEdit, self).keyPressEvent(e) ctrlOrShift = e.modifiers() & (Qt.ControlModifier | Qt.ShiftModifier)
if (not self.cmp or (ctrlOrShift and e.text().isEmpty())):
return eow = QString("~!@#$%^&*()_+{}|:\"<>?,./;'[]\\-=")
hasModifier = (e.modifiers() != Qt.NoModifier) and not ctrlOrShift
completionPrefix = self.textUnderCursor()
# hide popup while matching invalid cases
if (not isShortcut and (hasModifier or e.text().isEmpty() or completionPrefix.length() < 1
or eow.contains(e.text().right(1)))):
self.cmp.popup().hide()
return self.cmp.update(completionPrefix)
self.cmp.popup().setCurrentIndex(self.cmp.completionModel().index(0, 0)) cr = self.cursorRect()
cr.setWidth(self.cmp.popup().sizeHintForColumn(0)
+ self.cmp.popup().verticalScrollBar().sizeHint().width())
word = self.p.split(' ')[:-1]
self.p = ''
for k in xrange(len(word)):
self.p += word[k]
print 'self.p=', self.p
self.cmp.complete(cr) class Completer(QCompleter):
def __init__(self, stringlist, parent=None):
super(Completer, self).__init__(parent)
self.stringlist = stringlist
self.setModel(QStringListModel()) # update function will trigger while the text has been modified
def update(self, completionText):
# generate a new QStringList instance
qsList = QStringList() # generate hint lists which returns by customatic definitions
newList = genMyStrList(completionText)
for item in newList:
qsList.append(item) self.stringlist = qsList
# filteredList = self.stringlist.filter(completionText, Qt.CaseInsensitive)
self.model().setStringList(self.stringlist)
self.popup().setCurrentIndex(self.model().index(0, 0)) # the function below defined a way to generate a string list
def genMyStrList(key):
my_str_list = trie.output_association(key)
return my_str_list def main():
app = QApplication(sys.argv)
app.processEvents()
form = UI()
form.show()
# splash.finish(form)
app.exec_()
window = QMainWindow()
window.statusBar().showMessage('Yuan Ziqi')
menubar = window.menuBar window.setWindowTitle('Auto Complete Demo')
window.resize(400, 200)
window.move(400, 100) edit = TextEdit()
edit.setFontPointSize(40)
edit.setCompleter(cmp)
# bt = addbutton()
# window.addDockWidget(bt)
window.setCentralWidget(edit)
window.show()
sys.exit(app.exec_()) if __name__ == '__main__':
print 'app is running successfully'
main()
基于trie树的具有联想功能的文本编辑器的更多相关文章
- 基于trie树做一个ac自动机
基于trie树做一个ac自动机 #!/usr/bin/python # -*- coding: utf-8 -*- class Node: def __init__(self): self.value ...
- 用trie树实现输入提示功能,输入php函数名,提示php函数
参照刘汝佳的trie树 结构体 #include "stdio.h" #include "stdlib.h" #include "string.h&q ...
- [转] Trie树详解及其应用
一.知识简介 最近在看字符串算法了,其中字典树.AC自动机和后缀树的应用是最广泛的了,下面将会重点介绍下这几个算法的应用. 字典树(Trie)可以保存一些字符串->值 ...
- Trie树详解及其应用
一.知识简介 最近在看字符串算法了,其中字典树.AC自动机和后缀树的应用是最广泛的了,下面将会重点介绍下这几个算法的应用. 字典树(Trie)可以保存一些字符串->值的对 ...
- Trie树也称字典树
Trie树 Trie树也称字典树,因为其效率很高,所以在在字符串查找.前缀匹配等中应用很广泛,其高效率是以空间为代价的. 一.Trie树的原理 利用串构建一个字典树,这个字典树保存了串的公共前缀信息, ...
- LeetCode Implement Trie (Prefix Tree) (实现trie树3个函数:插入,查找,前缀)
题意:实现trie树的3个功能,只含小写字母的串. 思路:老实做即可! class TrieNode { public: TrieNode* chd[]; bool flag; // Initiali ...
- Trie 树(转)
看了很多 Trie 树的介绍, 这篇讲的最好,简单易懂(特别是代码部分),直接转载:http://www.cnblogs.com/dolphin0520/archive/2011/10/11/2207 ...
- 【动画】看动画轻松理解「Trie树」
Trie树 Trie这个名字取自“retrieval”,检索,因为Trie可以只用一个前缀便可以在一部字典中找到想要的单词. 虽然发音与「Tree」一致,但为了将这种 字典树 与 普通二叉树 以示区别 ...
- Trie树(Prefix Tree)介绍
本文用尽量简洁的语言介绍一种树形数据结构 -- Trie树. 一.什么是Trie树 Trie树,又叫字典树.前缀树(Prefix Tree).单词查找树 或 键树,是一种多叉树结构.如下图: 上图是一 ...
随机推荐
- Python标准库--typing
作者:zhbzz2007 出处:http://www.cnblogs.com/zhbzz2007 欢迎转载,也请保留这段声明.谢谢! 1 模块简介 Python 3.5 增加了一个有意思的库--typ ...
- js数组学习整理
原文地址:js数组学习整理 常用的js数组操作方法及原理 1.声明数组的方式 var colors = new Array();//空的数组 var colors = new Array(3); // ...
- 分页插件--根据Bootstrap Paginator改写的js插件
刚刚出来实习,之前实习的公司有一个分页插件,和后端的数据字典约定好了的,基本上是看不到内部是怎么实现的,新公司是做WPF的,好像对于ASP.NET的东西不多,导师扔了一个小系统给我和另一个同事,指了两 ...
- gulp批量打包文件并提取公共文件
gulp是前端开发过程中对代码进行构建的工具,是自动化项目的构建利器. browseriyf是模块化打包工具. 一般情况下,Browserify 会把所有的模块打包成单个文件.单个文件在大多数情况下是 ...
- 完美解决CodeSmith无法获取MySQL表及列Description说明注释的方案
问题描述: CodeSmith是现在比较实用的代码生成器,但是我们发现一个问题: 使用CodeSmith编写MySQL模板的时候,会发现一个问题:MySQL数据表中的列说明获取不到,也就是column ...
- LeetCode All in One 题目讲解汇总(持续更新中...)
终于将LeetCode的免费题刷完了,真是漫长的第一遍啊,估计很多题都忘的差不多了,这次开个题目汇总贴,并附上每道题目的解题连接,方便之后查阅吧~ 477 Total Hamming Distance ...
- 2DToolkit官方文档中文版打地鼠教程(一):初始设置
这是2DToolkit官方文档中 Whack a Mole 打地鼠教程的译文,为了减少文中过多重复操作的翻译,以及一些无必要的句子,这里我假设你有Unity的基础知识(例如了解如何新建Sprite等) ...
- Mono 3.8发布:性能进一步改进,可伸缩性提升
9月4日,Mono 3.8.0发布了.该版本的运行时带来了一些性能和可伸缩性方面的改进,同时完成了向Windows平台的移植. Mono遵循Gnome和Linux内核的版本编号策略,这意味着3.8是3 ...
- 让Mono 4在Raspberry Pi上飞
最近公司有项目想要在树莓派上做,代替原来的工控机(我们是把工控主机当作小的主机用,一台小的工控主机最少也要600左右,而树莓派只要200多).于是,公司买了一个Raspberry Pi B+和一个Ra ...
- C# 线程同步的三类情景
C# 已经提供了我们几种非常好用的类库如 BackgroundWorker.Thread.Task等,借助它们,我们就能够分分钟编写出一个多线程的应用程序. 比如这样一个需求:有一个 Winform ...