在 C++ 上使用套接字的 http 请求

http request using sockets on c++

我正在尝试使用 Linux 上的套接字发出 HTTP 请求,我的函数现在可以正常工作,但仅适用于 www.google.comwebpage.000webhostapp.com 等简单域。当我尝试添加路径和查询 webpage.000webhostapp.com/folder/file.php?parameter=value 时,它开始失败。

这是我的代码:

#include <iostream>
#include <cstring>
#include <string>
#include <sys/socket.h>
#include <arpa/inet.h>
#include <sys/types.h>
#include <netinet/in.h>
#include <netdb.h>
#include <stdio.h>

int main(){
 int socket_desc;
 struct sockaddr_in serv_addr;
 struct hostent *server;
 char buffer[4096];

 std::string url = "www.exampleweb.com/folder/file.php";

 socket_desc = socket(AF_INET, SOCK_STREAM, 0);
 if(socket_desc < 0){
  std::cout<<"failed to create socket"<<std::endl;
 }

 server = gethostbyname(url.c_str());
 if(server==NULL){std::cout<<"could Not resolve hostname :("<<std::endl;}
 bzero((char *) &serv_addr, sizeof(serv_addr));
 serv_addr.sin_family = AF_INET;
 serv_addr.sin_port = htons(80);
 bcopy((char *)server->h_addr,
         (char *)&serv_addr.sin_addr.s_addr,
         server->h_length);

 if(connect(socket_desc, (struct sockaddr *)&serv_addr, sizeof(serv_addr)) < 0){
   std::cout<<"connection failed :("<<std::endl;
 }
 std::string request = "GET / HTTP/1.1\r\nHost: " + url + "\r\nConnection: close\r\n\r\n";

 if(send(socket_desc, request.c_str(), strlen(request.c_str())+1, 0) < 0){
  std::cout<<"failed to send request..."<<std::endl;
 }
 int n;
 std::string raw_site;
 while((n = recv(socket_desc, buffer, sizeof(buffer)+1, 0)) > 0){
  int i = 0;
        while (buffer[i] >= 32 || buffer[i] == '\n' || buffer[i] == '\r'){

            raw_site+=buffer[i];
            i += 1;
        }
 }

 std::cout<<raw_site<<std::endl;
 return 0;
}

使用 www.google.com,它非常适合请求。

使用 www.example.com/folder/file.php?parameter=value&parameter2=value2,它失败并且 returns "could not resolve hostname"

知道如何解决吗?

我没有使用 curl,也不能将其用于此项目。

gethostbyname()(BTW 已被弃用,您应该使用 getaddrinfo() 代替)不适用于 URLs,仅适用于主机名。

给定一个像http://www.exampleweb.com/folder/file.php?parameter=value&parameter2=value2这样的URL,你需要先把它分解成它的组成部分(阅读RFC 3986),例如:

  • 方案http
  • 主机名www.exampleweb.com
  • 资源路径/folder/file.php
  • 查询?parameter=value&parameter2=value2

然后您可以解析主机的 IP 地址,连接到端口 80(HTTP 的默认端口)上的 IP 地址,因为 URL 没有指定不同的端口,最后发送一个GET 请求资源和查询。

此外,请注意 GET 请求中的 Host header 必须指定 主机名(和端口,如果不同比默认值),而不是整个 URL。而且 HTTP 请求不是 null-terminated 字符串,所以不要发送空终止符。阅读 RFC 2616.

试试这个:

#include <iostream>
#include <cstring>
#include <string>
#include <sys/socket.h>
#include <arpa/inet.h>
#include <sys/types.h>
#include <netinet/in.h>
#include <netdb.h>
#include <stdio.h>

int main(){
    int socket_desc;
    struct sockaddr_in serv_addr;
    struct hostent *server;
    char buffer[4096];

    std::string host = "www.exampleweb.com";
    std::string port = "80";
    std::string resource = "/folder/file.php";
    std::string query = "?parameter=value&parameter2=value2";

    socket_desc = socket(AF_INET, SOCK_STREAM, 0);
    if (socket_desc < 0){
        std::cout << "failed to create socket" << std::endl;
        return 0;
    }

    server = gethostbyname(host.c_str());
    if (server == NULL){
        std::cout << "could Not resolve hostname :(" << std::endl;
        close(socket_desc);
        return 0;
    }

    bzero((char *) &serv_addr, sizeof(serv_addr));
    serv_addr.sin_family = AF_INET;
    serv_addr.sin_port = htons(std::stoi(port));
    bcopy((char *)server->h_addr, (char *)&serv_addr.sin_addr.s_addr, server->h_length);

    if (connect(socket_desc, (struct sockaddr *)&serv_addr, sizeof(serv_addr)) < 0){
        std::cout << "connection failed :(" << std::endl;
        close(socket_desc);
        return 0;
    }

    std::string request = "GET " + resource + query + " HTTP/1.1\r\nHost: " + host + "\r\nConnection: close\r\n\r\n";

    if (send(socket_desc, request.c_str(), request.size(), 0) < 0){
        std::cout << "failed to send request..." << std::endl;
        close(socket_desc);
        return 0;
    }

    int n;
    std::string raw_site;
    while ((n = recv(socket_desc, buffer, sizeof(buffer), 0)) > 0){
        raw_site.append(buffer, n);
    }

    close(socket_desc);

    std::cout << raw_site << std::endl;
    return 0;
}