135 lines
2.7 KiB
C++
135 lines
2.7 KiB
C++
#include "common.h"
|
|
#include "huffman.h"
|
|
#define pb push_back
|
|
|
|
|
|
|
|
int getweight(string s)
|
|
{
|
|
if(s[0]=='$')
|
|
return 1000;
|
|
else if(s=="farmer"||s.length()==1||s=="example")return 1;
|
|
else return 10;
|
|
}
|
|
struct clause
|
|
{
|
|
vector<string> words;
|
|
vector<int> weights;
|
|
string s;
|
|
int weight;
|
|
void parse()
|
|
{
|
|
string word="";
|
|
bool iseq=false;
|
|
for(int j=0;j<s.length();j++)
|
|
{
|
|
if(s.at(j)=='$') iseq=!iseq;
|
|
if(('a'<=s.at(j)&&s.at(j)<='z')||('A'<=s.at(j)&&s.at(j)<='Z')||('0'<=s.at(j)&&s.at(j)<='9')||(iseq&&s.at(j)!=' '))
|
|
word+=('A'<=s.at(j)&&s.at(j)<='Z')?(s.at(j)-'A'+'a'):(s.at(j));
|
|
else
|
|
{
|
|
if(!iseq)
|
|
{
|
|
if(word!="")words.pb(word);
|
|
word="";
|
|
}
|
|
}
|
|
}
|
|
if(word!="") words.pb(word);
|
|
}
|
|
void calcweight()
|
|
{
|
|
for(auto& w: words)weights.pb(getweight(w));
|
|
weight=-100000;
|
|
for(auto& w : weights)if(w>weight)weight=w;
|
|
}
|
|
};
|
|
struct sentence
|
|
{
|
|
vector<clause> clauses;
|
|
string s;
|
|
int weight;
|
|
void parse()
|
|
{
|
|
string cl="";
|
|
bool iseq=false;
|
|
for(int j=0;j<s.length();j++)
|
|
{
|
|
if(s.at(j)=='$') iseq=!iseq;
|
|
if(s.at(j)!=','|| iseq) cl+=s.at(j);
|
|
else
|
|
{
|
|
clause tmp;
|
|
tmp.s=cl;clauses.pb(tmp);cl="";
|
|
}
|
|
}
|
|
clause tmp;
|
|
tmp.s=cl;clauses.pb(tmp);
|
|
for(auto& c:clauses) c.parse();
|
|
int numclause=0;
|
|
for(int i=0;i<clauses.size();i++)
|
|
if(clauses[i].words.size()!=0)
|
|
{
|
|
auto tmp=clauses[i];
|
|
clauses[numclause]=tmp;
|
|
numclause++;
|
|
}
|
|
clauses.resize(numclause);
|
|
}
|
|
void calcweight()
|
|
{
|
|
weight=-100000;
|
|
for(auto& c : clauses)
|
|
{
|
|
c.calcweight();
|
|
if(c.weight>weight)weight=c.weight;
|
|
}
|
|
}
|
|
};
|
|
vector<sentence> text;
|
|
vector<int> value;
|
|
string line;
|
|
int b,c;
|
|
void init()
|
|
{
|
|
cin>>c;
|
|
ifstream stin("soc1.txt");
|
|
string sentencefile="";
|
|
bool iseq=false;
|
|
while(getline(stin,line))
|
|
{
|
|
for(int i=0;i<line.length();i++)
|
|
{
|
|
b++;
|
|
if(line.at(i)=='$') iseq=!iseq;
|
|
if((line.at(i)!='.'&&line.at(i)!='?'&&line.at(i)!='!')|| iseq)sentencefile+=line.at(i);
|
|
else
|
|
{
|
|
sentence tmp;tmp.s=sentencefile;text.pb(tmp);
|
|
sentencefile="";
|
|
}
|
|
}
|
|
b++;
|
|
sentencefile+=' ';
|
|
}
|
|
for(auto& i:text)i.parse();
|
|
}
|
|
int main() {
|
|
/*init();
|
|
for(sentence& i:text)
|
|
{
|
|
for(clause& j:i.clauses)
|
|
{
|
|
for(auto k:j.words)
|
|
{
|
|
cout<<k<<endl;
|
|
}
|
|
}
|
|
}*/
|
|
|
|
vector<bool> test = huffman::encode("asdfjkl;1234");
|
|
for (auto b : test) cout << b;
|
|
cout << '\n';
|
|
string s = huffman::decode(test);
|
|
cout << s << '\n';
|
|
} |