商品
了解如何使用网页爬虫 API 获取 Target 的搜索结果。了解请求参数和结构化数据输出。
target_product 数据源(source)旨在检索 Target 产品结果页面。我们可以返回您所需的任何 Target 页面的 HTML。此外,我们还可以提供 Target 产品页面的结构化(已解析)输出。
请求示例
下面的示例说明如何获取已解析的 Target 产品页面结果。
curl 'https://realtime.oxylabs.io/v1/queries' \
--user 'USERNAME:PASSWORD' \
-H 'Content-Type: application/json' \
-d '{
"source": "target_product",
"product_id": "91936637",
"render": "html",
"parse": true
}'
import requests
from pprint import pprint

# Build the job payload: a rendered, parsed Target product page.
payload = {
    'source': 'target_product',
    'product_id': '91936637',
    'render': 'html',
    'parse': True,
}

# Send the job to the Realtime endpoint. Replace USERNAME and PASSWORD with
# your API user credentials (the same placeholders the other samples use).
response = requests.post(
    'https://realtime.oxylabs.io/v1/queries',
    auth=('USERNAME', 'PASSWORD'),
    json=payload,
)

# Unlike a response that carries a job status and a results URL, this call
# returns the JSON response with the results directly.
pprint(response.json())
const https = require("https");
// API user credentials; replace the placeholders with your own.
const username = "USERNAME";
const password = "PASSWORD";

// Job parameters: fetch a rendered, parsed Target product page.
const body = {
  source: "target_product",
  product_id: "91936637",
  render: "html",
  parse: true,
};

// HTTP Basic credentials, base64-encoded as "username:password".
const credentials = Buffer.from(`${username}:${password}`).toString("base64");

const options = {
  hostname: "realtime.oxylabs.io",
  path: "/v1/queries",
  method: "POST",
  headers: {
    "Content-Type": "application/json",
    Authorization: `Basic ${credentials}`,
  },
};

const request = https.request(options, (response) => {
  // Decode as UTF-8 text so that a multi-byte character split across two
  // chunks is not corrupted when the chunks are concatenated.
  response.setEncoding("utf8");

  let data = "";

  response.on("data", (chunk) => {
    data += chunk;
  });

  response.on("end", () => {
    // A non-JSON body (for example an HTML error page) must not crash the
    // script with an uncaught SyntaxError; report it and show the raw body.
    try {
      const responseData = JSON.parse(data);
      console.log(JSON.stringify(responseData, null, 2));
    } catch (error) {
      console.error(
        `Error: could not parse response (HTTP ${response.statusCode}):`,
        error.message,
      );
      console.error(data);
    }
  });
});

request.on("error", (error) => {
  console.error("Error:", error);
});

request.write(JSON.stringify(body));
request.end();
# 您提交的整个字符串必须进行 URL 编码。
https://realtime.oxylabs.io/v1/queries?source=target_product&product_id=91936637&render=html&parse=true&access_token=12345abcde
<?php
// Job parameters: fetch a rendered, parsed Target product page.
$params = array(
    'source' => 'target_product',
    'product_id' => '91936637',
    'render' => 'html',
    'parse' => true
);

$ch = curl_init();

curl_setopt($ch, CURLOPT_URL, "https://realtime.oxylabs.io/v1/queries");
// Make curl_exec() return the response body instead of printing it directly.
curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
curl_setopt($ch, CURLOPT_POSTFIELDS, json_encode($params));
curl_setopt($ch, CURLOPT_POST, 1);
curl_setopt($ch, CURLOPT_USERPWD, "USERNAME" . ":" . "PASSWORD");

$headers = array();
$headers[] = "Content-Type: application/json";
curl_setopt($ch, CURLOPT_HTTPHEADER, $headers);

$result = curl_exec($ch);

// Report transport errors; only echo the body when the request succeeded
// (curl_exec() returns false on failure).
if (curl_errno($ch)) {
    echo 'Error:' . curl_error($ch);
} else {
    echo $result;
}
curl_close($ch);
package main
import (
	"bytes"
	"encoding/json"
	"fmt"
	"io/ioutil"
	"net/http"
)

// main submits a Realtime query for a rendered, parsed Target product page
// and prints the raw response body. Any failure is printed and ends the
// program instead of being ignored.
func main() {
	const Username = "USERNAME"
	const Password = "PASSWORD"

	payload := map[string]interface{}{
		"source":     "target_product",
		"product_id": "91936637",
		"render":     "html",
		"parse":      true,
	}

	jsonValue, err := json.Marshal(payload)
	if err != nil {
		fmt.Println("Error:", err)
		return
	}

	client := &http.Client{}
	request, err := http.NewRequest("POST",
		"https://realtime.oxylabs.io/v1/queries",
		bytes.NewBuffer(jsonValue),
	)
	if err != nil {
		fmt.Println("Error:", err)
		return
	}

	// Declare the JSON body explicitly, as the other language samples do.
	request.Header.Set("Content-Type", "application/json")
	request.SetBasicAuth(Username, Password)

	// On a transport error the response is nil, so it must not be touched.
	response, err := client.Do(request)
	if err != nil {
		fmt.Println("Error:", err)
		return
	}
	defer response.Body.Close()

	responseText, err := ioutil.ReadAll(response.Body)
	if err != nil {
		fmt.Println("Error:", err)
		return
	}

	fmt.Println(string(responseText))
}
using System;
using System.Collections.Generic;
using System.Net.Http;
using System.Net.Http.Json;
using System.Threading.Tasks;
namespace OxyApi
{
class Program
{
/// <summary>
/// Submits a Realtime query for a rendered, parsed Target product page and
/// writes the raw response body to the console.
/// </summary>
static async Task Main()
{
    const string Username = "USERNAME";
    const string Password = "PASSWORD";

    var parameters = new
    {
        source = "target_product",
        product_id = "91936637",
        render = "html",
        parse = true
    };

    // Dispose the client, request and response once the call completes.
    using var client = new HttpClient
    {
        BaseAddress = new Uri("https://realtime.oxylabs.io")
    };

    using var requestMessage = new HttpRequestMessage(HttpMethod.Post, "/v1/queries")
    {
        Content = JsonContent.Create(parameters)
    };

    // HTTP Basic credentials: base64 of the UTF-8 bytes of "username:password".
    var authenticationString = $"{Username}:{Password}";
    var base64EncodedAuthenticationString = Convert.ToBase64String(System.Text.Encoding.UTF8.GetBytes(authenticationString));
    requestMessage.Headers.Add("Authorization", "Basic " + base64EncodedAuthenticationString);

    using var response = await client.SendAsync(requestMessage);
    var contents = await response.Content.ReadAsStringAsync();

    Console.WriteLine(contents);
}
}
}
package org.example;
import okhttp3.*;
import org.json.JSONObject;
import java.util.concurrent.TimeUnit;
public class Main implements Runnable {
private static final String AUTHORIZATION_HEADER = "Authorization";
public static final String USERNAME = "USERNAME";
public static final String PASSWORD = "PASSWORD";
/**
 * Posts a Realtime query for a rendered, parsed Target product page and
 * prints the response body, then terminates the JVM.
 */
public void run() {
    JSONObject payload = new JSONObject()
            .put("source", "target_product")
            .put("product_id", "91936637")
            .put("render", "html")
            .put("parse", true);

    var jsonMediaType = MediaType.parse("application/json; charset=utf-8");
    var requestBody = RequestBody.create(payload.toString(), jsonMediaType);
    var postRequest = new Request.Builder()
            .url("https://realtime.oxylabs.io/v1/queries")
            .post(requestBody)
            .build();

    // Answers an authentication challenge by re-issuing the request with
    // HTTP Basic credentials attached.
    Authenticator basicAuthenticator = (route, challengedResponse) -> {
        String basicCredential = Credentials.basic(USERNAME, PASSWORD);

        return challengedResponse
                .request()
                .newBuilder()
                .header(AUTHORIZATION_HEADER, basicCredential)
                .build();
    };

    var httpClient = new OkHttpClient.Builder()
            .authenticator(basicAuthenticator)
            .readTimeout(180, TimeUnit.SECONDS)
            .build();

    try (var httpResponse = httpClient.newCall(postRequest).execute()) {
        var rawBody = httpResponse.body();
        if (rawBody != null) {
            try (var responseBody = rawBody) {
                System.out.println(responseBody.string());
            }
        }
    } catch (Exception failure) {
        System.out.println("Error: " + failure.getMessage());
    }

    System.exit(0);
}
/** Entry point: runs the request on a separate thread. */
public static void main(String[] args) {
    Thread worker = new Thread(new Main());
    worker.start();
}
}
{
"source": "target_product",
"product_id": "91936637",
"geo_location": "United States",
"render": "html",
"parse": true
}
在我们的示例中,我们使用同步的 Realtime 集成方法。如果您想使用 Proxy Endpoint 或异步的 Push-Pull 集成,请参阅“集成方法”部分。
请求参数值
通用
- 必填参数
本地化
根据特定商店、履行类型、配送地点调整结果。
参数
说明
类型
fulfillment_type
设置履约类型。可用值为:pickup、delivery、shipping。
字符串
store_id
设置门店位置。
整数
delivery_zip
设置收货邮编位置。
字符串
输出数据字典
产品
HTML 示例

{
"content": {
"url": "https://www.target.com/p/apple-iphone-se-2nd-generation-lte-pre-owned-unlocked-64gb-black/-/A-89278891#lnk=sametab",
"brand": {
"href": "/b/apple/-/N-5y3ej",
"name": "查看全部 Apple"
},
"price": 199.99,
"title": "二手 Apple iPhone SE(第2代)(64GB)解锁版 - 黑色",
"category": "解锁手机",
"currency": "USD",
"description": "二手电子产品看起来像新的一样——对地球和您的钱包更好。 <...> 并在未来继续享受功能和安全更新。",
"rating_score": 3.6,
"parse_status_code": 12000
},
"created_at": "2024-06-13 10:47:53",
"updated_at": "2024-06-13 10:48:19",
"page": 1,
"url": "https://www.target.com/p/apple-iphone-se-2nd-generation-lte-pre-owned-unlocked-64gb-black/-/A-89278891#lnk=sametab",
"job_id": "7206970531281641473",
"status_code": 200,
"parser_type": "target_product"
}
JSON 结构
下表详细列出了我们从产品页面中解析出的每个元素,以及其描述和数据类型。表中还包含一些元数据。
键
说明
类型
url
产品页面的 URL。
字符串
brand
包含品牌详情的对象。
对象
brand.href
指向品牌页面的 URL。
字符串
brand.name
品牌名称。
字符串
price
产品的价格。
float
title
产品标题。
字符串
category
产品的类别。
字符串
currency
价格所使用的货币。
字符串
description
产品的详细描述。
字符串
rating_score
产品的评分分数。
float
created_at
抓取任务创建的时间戳。
时间戳
updated_at
抓取任务完成的时间戳。
时间戳
parser_type
用于提取数据的解析器类型。
字符串
job_id
与抓取任务关联的作业 ID。
字符串
最后更新于
这有帮助吗?

