[c++ ,BitTorrent]编程实现解析种子文件_版本1-夏目玲子-ChinaUnix博客

Aimerの博客

首页　| 　博文目录　| 　关于我

夏目玲子

博客访问： 597116
博文数量： 104
博客积分： 0
博客等级：民兵
技术积分： 1559
用户组：普通用户
注册时间： 2014-08-21 00:58

个人简介

锻炼精神,首先要锻炼肉体

文章分类

全部博文（104）

笔试题整理（2）

组合数学（1）

pat（1）
mysql（1）
linux comma（0）
java（10）

IDEA_Junit（1）

netty（2）

zookeeper（5）

configuration（2）
翻译/translate（12）

java_doc（1）

linux_cmd（1）

boost（6）
part three（4）

cereal（0）

openssl（2）

osip（0）
分布式操作系统（1）
脚本（3）

正则表达范式（0）

shell（1）

python（1）
bson（3）
git（3）
BitTorrent（7）
linux（1）
笔试题（3）

数据结构（0）

leetcode 解（1）
数据库源码分析（4）

mysql（0）

emeraldb（3）
学习卡片（1）
数据库原理（1）
计划，心得（1）
C/C++编程（47）

linux（2）

boost（13）

PAT（8）

linux/POSIX（6）

GNU，gcc（0）

STL（0）

algorithm（0）

boost（0）
未分配的博文（0）

文章存档

2018年（1）

2016年（1）

2015年（101）

2014年（1）

我的朋友

GFree_Wi

相关博文

[c++ ,BitTorrent]编程实现解析种子文件_版本1

分类： C/C++

2015-04-16 10:47:47

这篇文章记录了一个解析 B 编码（bencode）种子文件的程序：各个模块的作用，
以及各方法之间的相互调用关系。
在程序中使用了 google 的 glog 日志库，详情可以参考前一篇文章:
http://blog.chinaunix.net/uid-28595538-id-4956104.html

平台：linux
编程工具 : g++

// Makefile

点击(此处)折叠或打开

# Builds the bencode / torrent parser demo binary "Main" (links against glog).
# Compiler options belong in CXXFLAGS, libraries in LDLIBS.
CXXFLAGS = -O3
LDLIBS = -lglog
OBJS = Main.o parserUtil.o torrentParser.o

# "all" and "clean" are commands, not files.
.PHONY: all clean

all: Main

# Link step; the objects come from make's built-in %.o: %.cpp rule.
# Recipe lines must start with a TAB character.
Main: $(OBJS)
	$(CXX) -o $@ $^ $(LDFLAGS) $(LDLIBS)

# Recompile when a header included by the sources changes.
Main.o torrentParser.o: torrentParser.h parserUtil.h
parserUtil.o: parserUtil.h

clean:
	rm -f Main *.o

// torrentParser.h

点击(此处)折叠或打开

#ifndef TORRENT_PARSER_H
#define TORRENT_PARSER_H
#include <string>
#include <stdint.h> // int64_t
#include <map>
#include <vector>
#include <iostream>
using namespace std ;
// Describes one payload file listed in a torrent.
// TorrentFile::encode fills it from the "length" entry and from either the
// "name" entry (single-file mode) or the main directory plus the "path"
// components (multi-file mode).
typedef struct _file
{
    int64_t     file_length ;   // value of the "length" entry
    std::string file_path ;     // path assembled by TorrentFile::encode
} file_t ;
// Contents of the torrent's "info" dictionary as extracted by
// TorrentFile::encode.
typedef struct _info
{
    int64_t             piece_length ;   // "piece length" entry: length of each file block (B)
    std::string         pieces ;         // "pieces" entry: hash values, 20*n long per the original note
    bool                is_multi_file ;  // true when the info dictionary has a "files" entry
    std::vector<file_t> file_list ;      // one element per file (a single element in single-file mode)
} info_t ;
// Flattened view of a .torrent file; every member is filled by
// TorrentFile::encode from the top-level key named in its comment.
typedef struct _torrent_file
{
    std::string              announce ;       // "announce"
    std::vector<std::string> announce_list ;  // "announce-list"
    std::string              comment ;        // "comment"
    std::string              created_by ;     // "created by"
    int64_t                  creation_date ;  // "creation date"
    std::string              encoding ;       // "encoding"
    info_t                   info ;           // "info" dictionary
} torrent_file_t ;
// Abstract base of every bencode node type (integer, string, list, dictionary).
// The virtual destructor lets containers delete nodes through an AnyNode*.
class AnyNode
{
public :
    virtual ~AnyNode ()
    {
    }

    // Writes a textual description of the node to standard output.
    virtual void print () = 0 ;

    // Parses one value from the front of `content`. The implementations in
    // this project erase the consumed text from `content` and return false
    // when the text does not start with a value of their type.
    virtual bool parser ( std::string &content ) = 0 ;
} ;
// Bencode integer node; parser() stores the decoded number in _value.
class IntegerNode : public AnyNode
{
public :
    // Start at 0 so that print() and readers of _value never see an
    // indeterminate value when parser() has not run or has failed
    // (e.g. for a default-initialised stack object).
    IntegerNode () : _value ( 0 ) {}

    virtual ~IntegerNode () {}

    // Parses "i<number>e" from the front of `content`; defined in torrentParser.cpp.
    virtual bool parser ( std::string &content ) ;

    // Prints the stored value to standard output.
    virtual void print ()
    {
        std::cout << "integer type , value [" << _value << "]" << std::endl ;
    }

    int64_t _value ;   // decoded integer
} ;
// Bencode string node; parser() stores the decoded bytes in _value.
class StringNode : public AnyNode
{
public :
    virtual ~StringNode ()
    {
    }

    // Parses "<length>:<bytes>" from the front of `content`; defined in torrentParser.cpp.
    virtual bool parser ( std::string &content ) ;

    // Prints the stored string to standard output.
    virtual void print ()
    {
        std::cout << "string type ,value [" << _value << "]" << std::endl ;
    }

    std::string _value ;   // decoded string content
} ;
// Bencode list node. Owns the child nodes stored in _value_list and deletes
// them in its destructor.
class ListNode : public AnyNode
{
public :
    ListNode () {}

    // Releases every child node owned by the list.
    virtual ~ListNode ()
    {
        for ( std::vector<AnyNode*>::iterator it = _value_list.begin () ;
              it != _value_list.end () ; ++it )
        {
            delete *it ; // deletes through AnyNode's virtual destructor
        }
        _value_list.clear () ;
    }

    // Parses "l<values>e" from the front of `content`; defined in torrentParser.cpp.
    virtual bool parser ( std::string &content ) ;

    // Prints every child node to standard output.
    virtual void print ()
    {
        std::cout << "type list " << std::endl ;
        for ( std::vector<AnyNode*>::iterator it = _value_list.begin () ;
              it != _value_list.end () ; ++it )
        {
            AnyNode *child = *it ;
            std::cout << "value " ;
            child->print () ;
            std::cout << std::endl ;
        }
    }

    std::vector<AnyNode*> _value_list ;   // owned child nodes, in input order

private :
    // Non-copyable: a copy would share the raw child pointers and both
    // destructors would delete them. Declared but intentionally not defined.
    ListNode ( const ListNode & ) ;
    ListNode & operator= ( const ListNode & ) ;
} ;
// Bencode dictionary node. Owns both the key nodes and the value nodes stored
// in _value_map and deletes them in its destructor.
// The map is ordered by key pointer, not by key text, so iteration order is
// unrelated to the order of keys in the input.
class DictNode : public AnyNode
{
public :
    DictNode () {}

    // Releases every key and value node owned by the dictionary.
    virtual ~DictNode ()
    {
        for ( std::map<StringNode*, AnyNode*>::iterator it = _value_map.begin () ;
              it != _value_map.end () ; ++it )
        {
            delete it->first ;
            delete it->second ;
        }
        _value_map.clear () ;
    }

    // Parses "d<key><value>...e" from the front of `content`; defined in torrentParser.cpp.
    virtual bool parser ( std::string &content ) ;

    // Prints every key/value pair to standard output.
    virtual void print ()
    {
        std::cout << "type dictionary " << std::endl ;
        for ( std::map<StringNode*, AnyNode*>::iterator it = _value_map.begin () ;
              it != _value_map.end () ; ++it )
        {
            StringNode *key = it->first ;
            AnyNode *value = it->second ;
            std::cout << "key " << std::endl ;
            key->print () ;
            std::cout << "value " << std::endl ;
            value->print () ;
        }
    }

    std::map<StringNode*, AnyNode*> _value_map ;   // owned key node -> owned value node

private :
    // Non-copyable: a copy would share the raw node pointers and both
    // destructors would delete them. Declared but intentionally not defined.
    DictNode ( const DictNode & ) ;
    DictNode & operator= ( const DictNode & ) ;
} ;
// Helpers that turn parsed bencode nodes into a torrent_file_t.
class TorrentFile
{
public :
    torrent_file_t torrent_file ;

    // Parses the bencoded text `torrent_file_content` and stores the fields
    // it finds in `torrent_structure`. Returns false when a required part
    // (such as the "info" dictionary) cannot be read.
    static bool encode ( const std::string &torrent_file_content ,
                         torrent_file_t &torrent_structure ) ;

    // update date : 2015/4/15 by Aimer
    // Copies the node's value into `integer_value`; stores -1 when the pointer is NULL.
    static void get_node_value ( IntegerNode *pIntegerNode ,
                                 int64_t &integer_value ) ;

    // Copies the node's value into `string_value`; stores "" when the pointer is NULL.
    static void get_node_value ( StringNode *pStringNode ,
                                 std::string &string_value ) ;

    // Returns the value node whose key text equals `key`, or NULL when no key matches.
    static AnyNode *find_target_node ( std::map<StringNode*, AnyNode*> &hash_map ,
                                       const std::string &key ) ;
} ;
#endif

//torrentParser.cpp

点击(此处)折叠或打开

#include <cstdio>
#include <cstring>
#include <iostream>
#include <vector>
#include <map>
#include <glog/logging.h>
#include "parserUtil.h"
#include "torrentParser.h"
using namespace std ;
bool IntegerNode::parser ( string &content )
{
if ( content.empty () )
{
LOG(WARNING)<< "[warnning] in integer's parser content is empty";
return false ;
}
if ( content[0] != 'i' )
{
LOG(WARNING)<< "[warnning] integer's parser content first element illegal";
return false ;
}
uint64_t pos = content.find ( 'e' , 0 ) ;
// find the position of char e from beginning of content
if ( pos == string::npos )
{
LOG(WARNING) << "[warnning] integer's parser content not find char e";
return false ;
}
string s_value = content.substr(1 , pos-1) ;
// extract the sub-string integer from content with out begin 'i' and end 'e'
parserUtils::string_to_integer (s_value , _value ) ;
// transfer string into integer(int64_t)
content = content.erase ( 0 , pos+1 ) ;
LOG(INFO) << "[info] integer's parser extract message "<< _value << " remain message " << content ;
return true ;
}
// Parses one bencode string ("<length>:<bytes>") from the front of `content`.
// On success the bytes are stored in _value, the consumed text is erased from
// `content` and true is returned. On failure `content` is left untouched and
// false is returned.
// The empty string "0:" is accepted. A length prefix that is not purely digits,
// or that claims more bytes than are available, is rejected.
bool StringNode::parser ( string & content )
{
    if ( content.empty () )
    {
        LOG(WARNING) <<"[warnning] string type's parser content is empty ";
        return false ;
    }

    // find ':' in the string_length:string_content structure
    const string::size_type colon = content.find ( ':' ) ;
    if ( colon == string::npos )
    {
        LOG(WARNING)<<"[warnning] string type's it is illegal string type with out ':' ";
        return false ;
    }

    // the length prefix must be one or more decimal digits
    if ( colon == 0 )
    {
        LOG(WARNING)<<"[warnning] string type's parser content length is illegal" ;
        return false ;
    }
    for ( string::size_type i = 0 ; i < colon ; ++i )
    {
        if ( content[i] < '0' || content[i] > '9' )
        {
            LOG(WARNING)<<"[warnning] string type's parser content length is illegal" ;
            return false ;
        }
    }

    int64_t count = 0 ;
    parserUtils::string_to_integer ( content.substr ( 0 , colon ) , count ) ;

    // bytes that follow the ':'; the declared length must fit inside them
    const string::size_type available = content.size () - colon - 1 ;
    if ( count < 0 || static_cast<uint64_t>( count ) > available )
    {
        LOG(WARNING)<<"[warnning] string type's parser declared length exceeds content" ;
        return false ;
    }
    const string::size_type length = static_cast<string::size_type>( count ) ;

    // colon+1 : beginning of the string content , length : number of its chars
    _value.assign ( content , colon + 1 , length ) ;

    // erase "<length>:" plus the string content itself
    content.erase ( 0 , colon + 1 + length ) ;
    LOG(INFO)<<"[info] string type parser extract message "<< _value
             << " remain content " << content ;
    return true ;
}
bool ListNode::parser ( string &content )
{
if ( content.empty () )
{
LOG(WARNING)<<"[warnning] list type parser content is empty ";
return false ;
}
if ( content[0] != 'l' )
{
LOG(WARNING)<<"[warnning] list type parser content with out list mark" ;
return false ;
}
content = content.erase ( 0 , 1 ) ;
// delete 'l' from content
while ( !content.empty () )
{
AnyNode *anyNode = NULL ;
if ( content [0] == 'l' )
{
anyNode = new ListNode () ;
}
else if ( content [0] == 'd')
{
anyNode = new DictNode () ;
}
else if ( content [0] == 'i' )
{
anyNode = new IntegerNode () ;
}
else if (content[0] >= '1' && content[0] <= '9')
{
anyNode = new StringNode () ;
}
else
{
LOG(WARNING)<<"[warnning] list parser list contain illegal message" ;
return false;
}
anyNode->parser ( content ) ;
// this method will parse the content into the right value type
// and store it into the memeber value variable (_value , _value_list ,value_map...)
_value_list.push_back ( anyNode ) ;
if ( content[0] == 'e' ) // is it the end of the list type ?
{
// here we arrived the end of the list ,
// we should erase the 'e' in content and break the cycle
content = content.erase ( 0 , 1 ) ;
break ;
}
}// while
LOG(INFO)<<"[info] list type parser remainning content " << content ;
return true ;
}
bool DictNode::parser ( string & content )
{
if ( content[0] != 'd' )
{
LOG(WARNING)<<"dictionary type parser content not begin with 'd' " ;
return false ;
}
if ( content.size () < 3 )
{
LOG(WARNING)<<"dictionary type parser content length illegal " ;
return false ;
}
content = content.erase ( 0 , 1 ) ;
// erase 'd' from content
// dict type : <key: string type><value: any type>
while ( !content.empty () )
{
StringNode *key = new StringNode () ;
key->parser ( content ) ;
// extract key message from content
if ( content.empty () )
{
LOG(INFO) << "[info] content is empty ,break ";
break ;
}
AnyNode *value = NULL ;
if ( content [0] == 'i' )
value = new IntegerNode () ;
else if ( content [0] == 'l' )
value = new ListNode () ;
else if ( content [0] == 'd' )
value = new DictNode () ;
else if ( content[0] >= '1' && content[0] <= '9' )
value = new StringNode () ;
else
{
LOG(WARNING)<<"[warnning] dict type parser dict contains illegal type" ;
return false ;
}
value->parser ( content ) ;
_value_map[key] = value ;
if ( content[0] == 'e' )
{
// arrived the end of the dict ; erase the 'e' in content
content = content.erase( 0 , 1 );
break ;
}
}
return true ;
}
// update date : 2015/4/15 by Aimer
// Copies the text held by `pStringNode` into `string_value`.
// A NULL node is reported with a warning and yields the empty string.
void TorrentFile::get_node_value (StringNode *pStringNode, string &string_value)
{
    if ( pStringNode != NULL )
    {
        string_value = pStringNode->_value ;
        return ;
    }

    LOG(WARNING)<<"[warnning] can not get string type value , empty" ;
    string_value.clear () ;
}
// Copies the number held by `pIntegerNode` into `integer_value`.
// A NULL node is reported with a warning and yields -1.
void TorrentFile::get_node_value ( IntegerNode *pIntegerNode , int64_t &integer_value )
{
    if ( pIntegerNode != NULL )
    {
        integer_value = pIntegerNode->_value ;
        return ;
    }

    LOG(WARNING)<<"[warnning] can not get integer type value , empty";
    integer_value = -1 ;
}
// Looks for the entry of `hash_map` whose key text equals `key`.
// Entries are scanned in map order; the first match's value node is returned.
// Returns NULL when nothing matches. A NULL key pointer ends the search
// immediately with a warning and NULL.
AnyNode * TorrentFile::find_target_node ( map<StringNode*, AnyNode*>&hash_map ,
                                          const string &key )
{
    map<StringNode*,AnyNode*>::iterator entry = hash_map.begin () ;
    while ( entry != hash_map.end () )
    {
        StringNode *candidate = entry->first ;
        if ( candidate == NULL )
        {
            LOG(WARNING)<<"[warnning] hash map key is NULL ";
            return NULL ;
        }
        if ( candidate->_value == key )
        {
            return entry->second ;
        }
        entry++ ;
    }
    return NULL ; // no key matched
}
// following method is used the parser torrent file which is the combination
// of all the B encoding parsers (type: integer , string , list, dict ...)
bool TorrentFile::encode ( const string & torrent_file_content , torrent_file_t &torrent_structure )
{
string file_string = torrent_file_content ;
DictNode *pFileDict = new DictNode () ;
pFileDict->parser ( file_string ) ;
// key word : "announce" ; type: string
get_node_value ( dynamic_cast<StringNode*>
(find_target_node( pFileDict->_value_map , "announce" )) , torrent_structure.announce ) ;
// key word : "created by" ; type : string
get_node_value ( dynamic_cast<StringNode*>
(find_target_node(pFileDict->_value_map, "created by")) , torrent_structure.created_by) ;
// key word : "creatation date" ; type :integer
get_node_value ( dynamic_cast<IntegerNode*>
( find_target_node( pFileDict->_value_map , "creation date")) , torrent_structure.creation_date ) ;
// key word : "comment" ; type : string
get_node_value ( dynamic_cast<StringNode*>
(find_target_node( pFileDict->_value_map , "comment" ) ), torrent_structure.comment ) ;
// key word : "encoding" ; type : string
get_node_value ( dynamic_cast<StringNode*>
(find_target_node (pFileDict->_value_map , "encoding" )), torrent_structure.encoding ) ;
// key word : "announce-list" ; type : list< contain element type : string >
AnyNode *pAnyNode_list = find_target_node ( pFileDict->_value_map , "announce-list" ) ;
if ( pAnyNode_list != NULL) // "announce-list" exists in .torrent file
{
ListNode *pAnnounceList = dynamic_cast<ListNode*>(pAnyNode_list) ;
// traverse the list , extract string into --> torrent_strucutre.announce_list :(vector<string> type)
for ( vector<AnyNode*>::iterator it = pAnnounceList->_value_list.begin () ;
it != pAnnounceList->_value_list.end () ; it++ )
{
string string_announce ;
get_node_value ( dynamic_cast<StringNode*>(*it) , string_announce ) ;
torrent_structure.announce_list.push_back (string_announce) ;
}
}
else
{
LOG(INFO)<<"[info] no key words : exists in torrent file" ;
}
// key word : "info" ; type : dictionary
// if single file mode , dictionary elements type : string
// if multi-file mode , dictionary elements type : string , list < element type : dictinary >
// dictionary element type : string<length>
// list <element type : string>
//
{
// first get info|type : dict ; from pFileDict
AnyNode *pAnyNode_dict = find_target_node ( pFileDict->_value_map , "info") ;
if ( pAnyNode_dict != NULL ) // get "info" key word
{
DictNode *pInfoDict = dynamic_cast<DictNode*>(pAnyNode_dict) ;
// get key word "pieces" from info --------> info.pieces type : string
get_node_value ( dynamic_cast<StringNode*>
(find_target_node( pInfoDict->_value_map , "pieces" )) , torrent_structure.info.pieces ) ;
// get key word "piece_length" from info ---> info.piece_length type : integer
get_node_value ( dynamic_cast<IntegerNode*>
(find_target_node(pInfoDict->_value_map , "piece length")), torrent_structure.info.piece_length ) ;
// get info.files from info ------> info.files type: list
AnyNode *pAnyNode_info_list = find_target_node ( pInfoDict->_value_map , "files" ) ;
if ( pAnyNode_info_list != NULL )
{
LOG(INFO)<<"[info] multi-file mode" ;
torrent_structure.info.is_multi_file = true ;
// files : list type exists , transfer it into ListType *
ListNode *pInfoFileList = dynamic_cast<ListNode*>( pAnyNode_info_list ) ;
// get main dir from info , type : string , k-words "name"
string main_dir ;
get_node_value ( dynamic_cast<StringNode*>
(find_target_node(pInfoDict->_value_map, "name")) , main_dir ) ;
// traverse the list : info.files list with element in dict type
for ( vector<AnyNode*>::iterator it_dict = pInfoFileList->_value_list.begin() ;
it_dict != pInfoFileList->_value_list.end() ; it_dict++ )
{
DictNode *pDictNode = dynamic_cast<DictNode*>(*it_dict) ;
if ( pDictNode != NULL)
{
// here on dict refers a sub file node
// a sub file node contain
// { integer type : file_length , list<string>: file sub-path }
file_t sub_file ;
sub_file.file_path += main_dir ; // first append the main dictionary into sub file
// extract sub file length from pDictNode
get_node_value ( dynamic_cast<IntegerNode*>
(find_target_node( pDictNode->_value_map , "length" ) ) ,
sub_file.file_length ) ;
// extract sub file path from pDictNode
// first find the path-list from pDictNode
AnyNode* pAnyNode_path_list = find_target_node ( pDictNode->_value_map , "path" ) ;
if ( pAnyNode_path_list != NULL )
{
// second if it is not null , transfer it into List type
ListNode *pSubPathList = dynamic_cast<ListNode*>(pAnyNode_path_list) ;
// third traverse the list's _value_list , extract each string
// append them together into the absolute path of subfile
// take care : the *it_sub_path is in type of StringNode *
for ( vector<AnyNode*>::iterator it_sub_path = pSubPathList->_value_list.begin() ;
it_sub_path != pSubPathList->_value_list.end () ; it_sub_path++ )
{
sub_file.file_path += "//" ; // first you should add seperator
get_node_value ( dynamic_cast<StringNode*>(*it_sub_path ),
sub_file.file_path ) ;
}
}
else
{
LOG(WARNING)<<"[warning] oh ,no , sub file path is empty ";
return false ;
}
torrent_structure.info.file_list.push_back (sub_file) ;
}
else
{
LOG(WARNING)<<"[warnning] failed transfer AnyNode* into DictNode* ";
return false ;
}
}
}
else
{
LOG(INFO)<<"[info] single file mode";
torrent_structure.info.is_multi_file = false ;
file_t single_file ;
// get info.files.file_length from info , type : integer , k-words "length"
get_node_value ( dynamic_cast<IntegerNode*>
(find_target_node(pInfoDict->_value_map , "length")) , single_file.file_length) ;
// get info.files.file_name from into , type : string , k-words "name"
get_node_value ( dynamic_cast<StringNode*>
(find_target_node(pInfoDict->_value_map , "name")) , single_file.file_path ) ;
torrent_structure.info.file_list.push_back (single_file) ;
}
}
else
{
LOG(WARNING)<<"[warnning] can not find key word : in torrent file " ;
return false ;
}
}
delete pFileDict ;
return true ;
}

公共类
//parserUtil.h

点击(此处)折叠或打开

#ifndef PARSER_UTIL_H
#define PARSER_UTIL_H
#include <string>
#include <stdint.h>
// Collection of static helper routines shared by the bencode parsers.
class parserUtils
{
public :
    // Converts the decimal text in `value` and stores the result in `integer`.
    static void string_to_integer ( std::string value ,
                                    int64_t &integer ) ;
} ;
#endif

//parserUtil.cpp
该文件实现了 string_to_integer 方法，用于将数字字符串（例如 "32167"）转换为数值类型的 32167。

点击(此处)折叠或打开

#include "parserUtil.h"
#include <stdint.h>
#include <limits>
#include <string>
using namespace std ;
// Converts the decimal text in `value` to a 64-bit integer.
//
// value   : optional leading '-', followed by decimal digits
// integer : receives the result; 0 when `value` holds no leading digits
//
// Conversion stops at the first character that is not a digit, so stray
// characters are never folded into the result. Values outside the int64_t
// range saturate at the nearest limit instead of overflowing, which would be
// undefined behaviour for a signed type.
void parserUtils::string_to_integer ( std::string value , int64_t &integer )
{
    const int64_t max_value = std::numeric_limits<int64_t>::max () ;
    const int64_t min_value = std::numeric_limits<int64_t>::min () ;

    std::string::size_type index = 0 ;
    bool negative = false ;
    if ( !value.empty () && value[0] == '-' )
    {
        negative = true ;
        index = 1 ;
    }

    int64_t result = 0 ;
    for ( ; index < value.size () ; ++index )
    {
        const char ch = value[index] ;
        if ( ch < '0' || ch > '9' )
            break ;
        const int digit = ch - '0' ;

        if ( negative )
        {
            // accumulate downwards so that the minimum value is representable
            if ( result < ( min_value + digit ) / 10 )
            {
                result = min_value ;
                break ;
            }
            result = result * 10 - digit ;
        }
        else
        {
            if ( result > ( max_value - digit ) / 10 )
            {
                result = max_value ;
                break ;
            }
            result = result * 10 + digit ;
        }
    }
    integer = result ;
}

// Main.cpp
主函数调用

点击(此处)折叠或打开

#include <cstdio>
#include <string>
#include <iostream>
#include <glog/logging.h>
#include "torrentParser.h"
#include "parserUtil.h"
using namespace std ;
int main ( int argc , char * argv[] )
{
string content ;
char type ;
AnyNode *pAnyNode = NULL ;
// first let init the google log
google::InitGoogleLogging(argv[0]) ;
// and then set the log file store path
FLAGS_log_dir = "./log/" ;
cout << "input parser's type [i->integer] [s->string] [l->list] [d->dictionary]" << endl ;
cin >> type ;
cout << "input content " << endl ;
cin >> content ;
switch ( type )
{
case 'i':
{
pAnyNode = new IntegerNode () ;
cout << "type of integer:" <<endl ;
pAnyNode->parser ( content ) ;
pAnyNode->print () ;
// update : 2015/4/15 by Aimer
// test get_node_value
int64_t integer_value ;
TorrentFile::get_node_value ( dynamic_cast<IntegerNode*>( pAnyNode) , integer_value ) ;
cout << "integer value "<< integer_value << endl ;
break ;
}
case 's' :
{
pAnyNode = new StringNode () ;
cout << "type of string :" <<endl ;
pAnyNode->parser( content ) ;
pAnyNode->print () ;
// update : 2015/4/15 by Aimer
// test TorrentFile::get_node_value , string type
string string_value ;
TorrentFile::get_node_value ( dynamic_cast<StringNode*>( pAnyNode) , string_value ) ;
cout<< "string value "<< string_value << endl ;
break ;
}
case 'l' :
{
pAnyNode = new ListNode () ;
cout <<"type of list :" <<endl ;
pAnyNode->parser ( content ) ;
pAnyNode->print () ;
break ;
}
case 'd' :
{
pAnyNode = new DictNode () ;
cout <<"type of dictionary" <<endl ;
pAnyNode->parser ( content ) ;
pAnyNode->print () ;
// update : 2015/4/15 , test find_target_node method
string key ;
cout << "input searching key words"<< endl ;
cin>> key ;
AnyNode *pAnyNode_value = TorrentFile::find_target_node ( (dynamic_cast<DictNode*>(pAnyNode))->_value_map, key ) ;
cout << "key->" << key << "value->";
pAnyNode_value->print () ;
break ;
}
default :
cout <<" error not such kind type " << endl ;
break ;
}
// here we begin testing the TorrentFile::encode method
// we need torrent-type file input string , and a null torrent_file_t variable
torrent_file_t torrent_structure ;
string torrent_string;
cout << "input your torrent file content" << endl ;
cin >> torrent_string ;
TorrentFile::encode ( torrent_string, torrent_structure ) ;
return 0 ;
}

github address:
end

阅读(1629) | 评论(0) | 转发(0) |

上一篇：[c++,glog] linux 平台上 glog 使用方法简介

下一篇：[c++ ,BitTorrent]编程实现解析种子文件_版本2

给主人留下些什么吧！~~

感谢所有关心和支持过ChinaUnix的朋友们

16024965号-6