當我連接到一些網站,它給了我:的WinSock分塊數據編碼
Content-Type: text/html; charset=ISO-8859-1
Connection: close
Transfer-Encoding: chunked
Date: Tue, 01 Jan 2013 18:49:53 GMT
fff8
,並在文件的結尾,它看起來像:
</script><!-- vBadvanced 1-3-9-4-8-0 -->
</body>
</html
1
>
0
但是當我做計算器。 com,它打印出來的效果非常好..它可能在源代碼中有額外的空白行,但這很好..爲什麼其他網站會添加數字?
我該如何解決?另外,我怎樣才能從html本身分離出這個頭文件?
我的代碼如下:
#define _WIN32_WINNT 0x501
#include <iostream>
#include <winsock2.h>
#include <ws2tcpip.h>
#include <stdio.h>
#include <fstream>
#include <vector>
using namespace std;
void Get(string WebPage)
{
WSADATA wsaData;
string Address;
struct addrinfo *result;
struct sockaddr_in *sockaddr_ipv4;
char Buffer[99000];
string Header = "GET/HTTP/1.1\r\n";
Header += "Host: " + WebPage + "\r\n";
Header += "Connection: close\r\n";
Header += "\r\n";
if (WSAStartup(MAKEWORD(2,2), &wsaData) != 0) return;
SOCKET Socket = socket(AF_INET,SOCK_STREAM,IPPROTO_TCP);
getaddrinfo(WebPage.c_str(), NULL, NULL, &result);
if (result->ai_family == AF_INET)
{
sockaddr_ipv4 = (struct sockaddr_in *) result->ai_addr;
Address = inet_ntoa(sockaddr_ipv4->sin_addr);
}
freeaddrinfo(result);
SOCKADDR_IN SockAddr;
memset(&SockAddr, 0, sizeof(SockAddr));
SockAddr.sin_port = htons(80);
SockAddr.sin_family = AF_INET;
SockAddr.sin_addr.s_addr = inet_addr(Address.c_str());
if(connect(Socket,(SOCKADDR*)(&SockAddr),sizeof(SockAddr)) == SOCKET_ERROR) return;
if (send(Socket, Header.c_str(), Header.size(), 0) == SOCKET_ERROR) return;
shutdown(Socket, SD_SEND);
std::string Response;
int bytes = 1;
while (bytes > 0)
{
bytes = recv(Socket, Buffer, sizeof(Buffer), 0);
Buffer[bytes] = '\0';
Response.append(Buffer, bytes);
};
closesocket(Socket);
WSACleanup();
}
int main()
{
Get("google.com");
}
無關,但你不檢查'recv'調用的錯誤。 –
如果您使用C或C++在Windows上執行HTTP,則應該查看WinInet(http://msdn.microsoft.com/en-us/library/windows/desktop/aa385331.aspx)或WinHTTP(http: //msdn.microsoft.com/en-us/library/windows/desktop/aa384273.aspx) –