forked from YeeYoungHan/cpphttpstack
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathHttpDownloadAll.cpp
More file actions
112 lines (94 loc) · 2.89 KB
/
Copy pathHttpDownloadAll.cpp
File metadata and controls
112 lines (94 loc) · 2.89 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
/*
* Copyright (C) 2012 Yee Young Han <websearch@naver.com> (http://blog.naver.com/websearch)
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
#include "HttpDownloadAll.h"
/**
 * @brief Fetches one file with HTTP GET and stores the response body in a local file.
 *
 * The request URL is pszUrl followed by pszFileName; a '/' separator is inserted
 * only when pszUrl does not already end with one. The body is written in binary
 * mode to a local file opened with the path pszFileName.
 *
 * @param pszUrl      base URL the file name is appended to; must not be NULL or empty
 * @param pszFileName last URL segment and, at the same time, the local file path; must not be NULL
 * @returns true when the body was fetched and written completely, otherwise false
 *          (an error message is printed to stdout in that case)
 */
bool DownloadFile( const char * pszUrl, const char * pszFileName )
{
	// Constructing std::string from NULL is undefined and an empty URL has no
	// last character to inspect, so reject both before touching the string.
	if( pszUrl == NULL || pszFileName == NULL || pszUrl[0] == '\0' )
	{
		printf( "url or file name is not defined\n" );
		return false;
	}

	CHttpClient clsHttpClient;
	std::string strContentType, strBody;
	std::string strUrl = pszUrl;

	// strUrl is known to be non-empty here, so indexing the last character is safe.
	if( strUrl[ strUrl.length() - 1 ] != '/' )
	{
		strUrl.append( "/" );
	}
	strUrl.append( pszFileName );

	if( clsHttpClient.DoGet( strUrl.c_str(), strContentType, strBody ) == false )
	{
		printf( "url(%s) get error\n", strUrl.c_str() );
		return false;
	}

	FILE * fd = fopen( pszFileName, "wb" );
	if( fd == NULL )
	{
		printf( "file(%s) open error\n", pszFileName );
		return false;
	}

	// A short write (e.g. disk full) must not be reported as success.
	size_t iWriteLen = fwrite( strBody.c_str(), 1, strBody.length(), fd );
	bool bWritten = ( iWriteLen == strBody.length() );

	// fclose flushes buffered data, so its failure also means the file is incomplete.
	if( fclose( fd ) != 0 )
	{
		bWritten = false;
	}

	if( bWritten == false )
	{
		printf( "file(%s) write error\n", pszFileName );

		// The caller in this file skips names that already exist locally, so a
		// truncated file left behind would never be downloaded again.
		remove( pszFileName );
		return false;
	}

	return true;
}
/**
 * @brief Downloads the files linked from an HTML listing page.
 *
 * Fetches the page at the URL given as the only command line argument, selects
 * the "a" elements found under html -> body -> pre and passes the "href" value of
 * each one to DownloadFile() together with the page URL.
 *
 * An href is skipped when it
 *  - is empty,
 *  - starts with "..",
 *  - contains '/' or '\\' (the value is used as a local file path, so it must be a
 *    plain file name and must not be able to point outside the working directory), or
 *  - is reported as existing by IsExistFile() (presumably a local file check;
 *    the helper is declared outside this file).
 *
 * @param argc number of command line arguments; must be 2
 * @param argv argv[1] is the URL of the listing page
 * @returns always 0; problems are reported on stdout only
 */
int main( int argc, char * argv[] )
{
	if( argc != 2 )
	{
		printf( "[Usage] %s {url}\n", argv[0] );
		return 0;
	}

	char * pszUrl = argv[1];
	CHttpClient clsHttpClient;
	std::string strContentType, strBody;
	CHtmlElement clsHtml;

	if( clsHttpClient.DoGet( pszUrl, strContentType, strBody ) == false )
	{
		printf( "url(%s) get error\n", pszUrl );
		return 0;
	}

	clsHtml.Parse( strBody.c_str(), strBody.length() );

	CHtmlElement * pclsHtmlBody = clsHtml.SelectElement( "body" );
	if( pclsHtmlBody == NULL )
	{
		printf( "html -> body is not found\n" );
		return 0;
	}

	CHtmlElement * pclsHtmlPre = pclsHtmlBody->SelectElement( "pre" );
	if( pclsHtmlPre == NULL )
	{
		printf( "html -> body -> pre is not found\n" );
		return 0;
	}

	HTML_ELEMENT_LIST clsAList;
	HTML_ELEMENT_LIST::iterator itAL;
	std::string strFileName;

	pclsHtmlPre->SelectElementList( "a", clsAList );

	for( itAL = clsAList.begin(); itAL != clsAList.end(); ++itAL )
	{
		if( itAL->SelectAttribute( "href", strFileName ) == false ) continue;

		// An empty href would request the listing URL again and try to open a
		// file with an empty name.
		if( strFileName.empty() ) continue;

		// Link to the parent directory.
		if( !strncmp( strFileName.c_str(), "..", 2 ) ) continue;

		// The href comes from the remote page and becomes a local path: accept
		// plain file names only. '\\' is a path separator on Windows, so it is
		// rejected in the same way as '/'.
		if( strFileName.find( '/' ) != std::string::npos ) continue;
		if( strFileName.find( '\\' ) != std::string::npos ) continue;

		if( IsExistFile( strFileName.c_str() ) ) continue;

		printf( "[%s]\n", strFileName.c_str() );

		// DownloadFile prints its own error message; a failed file does not stop
		// the remaining downloads.
		DownloadFile( pszUrl, strFileName.c_str() );
	}

	return 0;
}