【发布时间】:2020-07-24 11:30:55
【问题描述】:
我想统计每个单词出现在多少篇文本中。目前我已经能统计每个单词在单篇文本中的出现次数(我把文本中的每个单词插入二叉树,再次遇到同一个单词时就把它的计数加一),但我不知道如何统计每个单词在所有文本中出现的篇数。
一个简单的例子:
文本 1:hello adam, my name is adam, I want to be happy. 文本 2:hello sam, where is he from?
(每个单词在单篇文本中的出现次数) Tree1: adam,2 hello,1 my,1 name,1 is,1 I,1 want,1 to,1 be,1 happy,1 (每个单词出现在多少篇文本中) Tree2: hello,2 adam,1 sam,1 where,1 is,2 ...
有人可以向我解释我该怎么做吗?或者帮我做一个这样的算法?
我的文件:
Node.hpp
// One node of the binary search tree: a string key, an int counter and two
// child links. In the posted usage the key is a word and the counter is how
// many times that word was inserted.
class Node{
private:
    Node *left = nullptr;   // left child
    Node *right = nullptr;  // right child
    std::string num;        // key stored in this node
public:
    // Counter attached to the key. Zero-initialised so that getOcc() is
    // well-defined on a node that has not been through setData() yet.
    int data = 0;

    Node();                                    // constructor
    void setData(std::string num, int data);   // stores key and counter
    std::string getData();                     // returns a copy of the key
    int &getOcc();                             // mutable reference to the counter
    void setLeft(Node *l);                     // sets left child pointer
    Node* &getLeft();                          // reference to the left child pointer
    void setRight(Node *r);                    // sets right child pointer
    Node* &getRight();                         // reference to the right child pointer
};
Node.cpp
// Builds a detached node: no children, empty key, counter at zero.
Node::Node()
    : left(nullptr), right(nullptr), data(0) {
    // data is set here so that getOcc() never reads an indeterminate value
    // on a node that has not been through setData() yet.
}
// Overwrites both the key and the counter held by this node.
void Node::setData(string num, int data){
    Node &self = *this;
    self.data = data;
    self.num = num;
}
// Returns a copy of the key stored in this node.
string Node::getData(){
    string key(num);
    return key;
}
int &Node::getOcc(){
return this->data;
}
// Replaces the left child link with l.
void Node::setLeft(Node *l){
    left = l;
}
// Returns a reference to the left child link, so callers can re-point it.
Node* &Node::getLeft(){
    Node *&link = left;
    return link;
}
// Replaces the right child link with r.
void Node::setRight(Node *r){
    right = r;
}
// Returns a reference to the right child link, so callers can re-point it.
Node* &Node::getRight(){
    Node *&link = right;
    return link;
}
BST.hpp
// Binary search tree keyed by a string, with an int counter stored per key.
class BST{
private:
    Node * root; // root node pointer
public:
    BST();  // constructor
    ~BST(); // destructor; frees every node
    // The destructor deletes all nodes, so a member-wise copy would free the
    // same nodes twice. Copying is therefore disabled.
    BST(const BST &) = delete;
    BST &operator=(const BST &) = delete;

    void Insert(std::string num, int data);      // inserts num, or adds one to its counter if already present
    void InsertIDF(std::string num, int data);   // inserts num only if absent; an existing entry is left untouched
    bool find(std::string num);                  // whether num is present (definition not shown here)
    void min();                                  // prints the smallest key
    void max();                                  // prints the largest key
    void save_file(std::string filename);        // saves the tree to a file (definition not shown here)
    void Delete(std::string num);                // removes num from the tree
    void LoadFromFile(std::string filename);     // loads keys from a file (definition not shown here)
    void Print();                                // prints the tree to stdout in key order
//private functions used as helper functions in the public operations
private:
    void printHelper(Node *root);
    bool findHelper(Node *root, std::string num);
    // current is taken by reference so the helpers can attach a new node
    // directly to the parent's child link (or to root).
    void InsertHelper(Node * &current, std::string num, int data);
    void InsertHelperIDF(Node * &current, std::string num, int data);
    void findMinHelper(Node* current);
    void findMaxHelper(Node * current);
    void saveHelper(std::ofstream &fout, Node* current);
    Node* DeleteHelper(Node *current, std::string num);
    Node * findMaximum(Node * n);
    void clear(Node *current);
};
BST.cpp
// Creates an empty tree (no root node yet).
BST::BST() : root(nullptr) {
}
// Releases every node reachable from the root.
BST::~BST(){
    Node *top = this->root;
    clear(top);
}
// Frees the subtree rooted at current: both children first, then the node.
void BST::clear(Node* current){
    if (current != nullptr) {
        Node *lhs = current->getLeft();
        Node *rhs = current->getRight();
        clear(lhs);
        clear(rhs);
        delete current;
    }
}
// Public entry point: starts the counting insertion at the root link.
void BST::Insert(string num, int data){
    Node *&top = root;
    InsertHelper(top, num, data);
}
void BST::InsertHelper( Node * ¤t, string num, int data ){
if ( current == nullptr ){
// create new node to be inserted
current = new Node();
current->setData( num, data );
current->setLeft( nullptr );
current->setRight( nullptr );
} else if ( num < current->getData() ){
InsertHelper( current->getLeft(), num, data );
} else if ( current->getData() < num ){
InsertHelper( current->getRight(), num, data );
} else {
int h = current->getOcc();
h++;
current->setData(num, h);
}
}
// Public entry point: starts the insert-if-absent operation at the root link.
void BST::InsertIDF(string num, int data){
    Node *&top = root;
    InsertHelperIDF(top, num, data);
}
void BST::InsertHelperIDF( Node * ¤t, string num, int data){
if ( current == nullptr ){
// create new node to be inserted
current = new Node();
current->setData( num, data );
current->setLeft( nullptr );
current->setRight( nullptr );
} else if ( num < current->getData() ){
InsertHelperIDF( current->getLeft(), num, data );
} else if ( current->getData() < num ){
InsertHelperIDF( current->getRight(), num, data );
}
}
void BST::min(){
findMinHelper(root);
}
// Prints the key of the leftmost node of the subtree rooted at current.
// Prints nothing for an empty subtree.
void BST::findMinHelper(Node* current){
    if (current == nullptr) {
        return;
    }
    // Keep stepping left; the node without a left child holds the minimum.
    Node *walker = current;
    while (walker->getLeft() != nullptr) {
        walker = walker->getLeft();
    }
    cout << walker->getData();
}
void BST::max(){
findMaxHelper(root);
}
// Prints the key of the rightmost node of the subtree rooted at current.
// Prints nothing for an empty subtree.
void BST::findMaxHelper(Node * current){
    if (current == nullptr) {
        return;
    }
    // Keep stepping right; the node without a right child holds the maximum.
    Node *walker = current;
    while (walker->getRight() != nullptr) {
        walker = walker->getRight();
    }
    cout << walker->getData();
}
void BST::Print(){
printHelper(root);
}
// In-order traversal: left subtree, then "<key> <counter> ", then right subtree.
void BST::printHelper(Node *current){
    if (current != nullptr) {
        printHelper(current->getLeft());
        cout << current->getData();
        cout << " ";
        cout << current->getOcc();
        cout << " ";
        printHelper(current->getRight());
    }
}
// Removes num from the tree; the root is re-pointed in case it was removed.
void BST::Delete(string num){
    Node *newRoot = DeleteHelper(root, num);
    root = newRoot;
}
// Removes the node holding num from the subtree rooted at current.
//   current - root of the subtree to search (may be null)
//   num     - key to remove
// Returns the root of the subtree after removal; the caller must store it in
// the link that previously pointed at current.
Node* BST::DeleteHelper(Node *current, string num){
    if (current == nullptr)
        return nullptr;

    if (current->getData() != num) { // not this node: descend
        if (num < current->getData()) {
            current->setLeft(DeleteHelper(current->getLeft(), num));
        } else {
            current->setRight(DeleteHelper(current->getRight(), num));
        }
        return current;
    }

    // Key found.
    if (current->getLeft() == nullptr) { // no left child: right subtree replaces this node
        Node *replacement = current->getRight();
        delete current;
        return replacement;
    }
    if (current->getRight() == nullptr) { // no right child: left subtree replaces this node
        Node *replacement = current->getLeft();
        delete current;
        return replacement;
    }

    // Two children: overwrite this node with its in-order predecessor (the
    // maximum of the left subtree), then remove that predecessor from the left
    // subtree. The predecessor has no right child, so the recursive call ends
    // in one of the single-child cases above.
    Node *maxnode = findMaximum(current->getLeft());
    const string predecessorKey = maxnode->getData();
    current->setData(predecessorKey, maxnode->getOcc());
    current->setLeft(DeleteHelper(current->getLeft(), predecessorKey));
    // NOTE(review): as in the original, the message is only printed for the
    // two-children case; the single-child cases return without printing.
    cout<<"Deleted!!!";
    return current;
}
// Returns the rightmost (largest-key) node of the subtree rooted at n,
// or nullptr when the subtree is empty.
Node* BST::findMaximum(Node * n){
    if (n == nullptr)
        return nullptr; // empty subtree: nothing to dereference
    while (n->getRight() != nullptr) // keep stepping right
        n = n->getRight();
    return n;
}
这是我的 main.cpp
// Fragment of main.cpp: feeds every word of every story into `tree`.
// NOTE(review): the closing brace of the outer story loop is not part of this
// excerpt, and x is not used in the lines shown.
int x = 0;
// go through each story (histoires is dereferenced to obtain the range)
for( Histoire * histoire : * histoires ) {
// go through each sentence of the current story; each Phrase is copied by value
for( Phrase p : * histoire ) {
// go through each word of the sentence (the element is also declared as Phrase)
for ( Phrase w : p ){
// Render the word as a std::string through its stream output operator
std::stringstream sstream;
sstream << w;
std::string s = sstream.str();
tree.Insert(s , 1); // insert the word; Insert adds one to its counter when the word is already stored
}
// Disabled attempt at filling the second tree; `t` is not defined in the lines shown.
// treeIDF.Insert(t,1);
};
【问题讨论】:
-
家庭作业还是真正的编程任务?如果是第二个,请使用
flex+grep+sort... 您必须指定单词的分解方式(空格、\t、\n 等) -
这是一个家庭作业,但正如你所看到的,我并不是想让别人为我做这件事,我只是找不到如何实现这一点,因为我有 3 个循环
-
您是否需要实施 BST?你能简单地使用
std::map吗? -
我希望这会在一分钟内完成 :(
-
我不确定您的问题在哪里?如果单个文档有效,那么您的 BST 是正确的,如果您可以使用
map进行操作,那么您知道如何处理多个文档。那么,你卡在哪里了?
标签: c++ tree insert binary-tree