2019-07-28 10:31:56 +08:00
|
|
|
|
// xml.cpp : Defines the entry point for the console application.
|
2014-11-19 00:25:21 +08:00
|
|
|
|
//
|
|
|
|
|
#include "stdafx.h"
|
|
|
|
|
#include <sys/time.h>
|
|
|
|
|
#include "util.h"
|
|
|
|
|
|
|
|
|
|
static void get_html(const char* file)
|
|
|
|
|
{
|
|
|
|
|
acl_xml_tag_init();
|
|
|
|
|
acl_xml_tag_add("img");
|
|
|
|
|
acl_xml_tag_add("BR");
|
|
|
|
|
acl_xml_tag_add("HR");
|
|
|
|
|
|
|
|
|
|
acl::string buf;
|
|
|
|
|
if (acl::ifstream::load(file, &buf) == false)
|
|
|
|
|
{
|
|
|
|
|
printf("load %s error %s\r\n", file, acl::last_serror());
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
struct timeval begin;
|
|
|
|
|
gettimeofday(&begin, NULL);
|
|
|
|
|
|
|
|
|
|
acl::xml xml(buf.c_str());
|
|
|
|
|
const acl::string& text = xml.getText();
|
|
|
|
|
|
|
|
|
|
struct timeval end;
|
|
|
|
|
gettimeofday(&end, NULL);
|
|
|
|
|
|
|
|
|
|
acl::string path(file);
|
|
|
|
|
path << ".txt";
|
|
|
|
|
|
|
|
|
|
acl::ofstream out;
|
|
|
|
|
if (out.open_write(path) == true)
|
|
|
|
|
out.write(text);
|
|
|
|
|
|
|
|
|
|
double spent = util::stamp_sub(&end, &begin);
|
|
|
|
|
printf("text:{%d}, spent: %.2f\r\n", (int) text.length(), spent);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int main(int argc, char* argv[])
|
|
|
|
|
{
|
|
|
|
|
if (argc < 2)
|
|
|
|
|
{
|
|
|
|
|
printf("usage: %s filepath\r\n", argv[0]);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
get_html(argv[1]);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|