mirror of
https://github.com/Jackett/Jackett.git
synced 2025-09-17 17:34:09 +02:00

extended refresh header handling to libcurl and safecurl also some minor tweaks needed to have Curl 'behave' with certain servers by adding accept-language header to Curl Added ability/template to allow the user to select their own SiteURL (see BitSoup implementation) with a minor update to ConfigurationData class to prevent the "display text" from disappearing on errors. XSpeeds indexer - updated to handle a case where the returned XML occasionally is null terminated resulting in XML parsing exceptions BitSoup indexer - added user customizable url selection, including some url validation BaseIndexer - cleaned up some of my earlier implementation for accumulating cookies.
198 lines
8.4 KiB
C#
198 lines
8.4 KiB
C#
using AutoMapper;
|
|
using CurlSharp;
|
|
using Jackett.Models;
|
|
using Jackett.Services;
|
|
using NLog;
|
|
using System;
|
|
using System.Collections.Generic;
|
|
using System.IO;
|
|
using System.Linq;
|
|
using System.Net;
|
|
using System.Net.Http;
|
|
using System.Text;
|
|
using System.Threading.Tasks;
|
|
|
|
namespace Jackett.Utils.Clients
|
|
{
|
|
public class UnixSafeCurlWebClient : IWebClient
|
|
{
|
|
IProcessService processService;
|
|
Logger logger;
|
|
IConfigurationService configService;
|
|
|
|
public UnixSafeCurlWebClient(IProcessService p, Logger l, IConfigurationService c)
|
|
{
|
|
processService = p;
|
|
logger = l;
|
|
configService = c;
|
|
}
|
|
|
|
public void Init()
|
|
{
|
|
}
|
|
|
|
public async Task<WebClientByteResult> GetBytes(WebRequest request)
|
|
{
|
|
logger.Debug(string.Format("UnixSafeCurlWebClient:GetBytes(Url:{0})", request.Url));
|
|
var result = await Run(request);
|
|
logger.Debug(string.Format("UnixSafeCurlWebClient: Returning {0} => {1} bytes", result.Status, (result.Content == null ? "<NULL>" : result.Content.Length.ToString())));
|
|
return result;
|
|
}
|
|
|
|
public async Task<WebClientStringResult> GetString(WebRequest request)
|
|
{
|
|
logger.Debug(string.Format("UnixSafeCurlWebClient:GetString(Url:{0})", request.Url));
|
|
var result = await Run(request);
|
|
logger.Debug(string.Format("UnixSafeCurlWebClient: Returning {0} => {1}", result.Status, (result.Content == null ? "<NULL>" : Encoding.UTF8.GetString(result.Content))));
|
|
return Mapper.Map<WebClientStringResult>(result);
|
|
}
|
|
|
|
private async Task<WebClientByteResult> Run(WebRequest request)
|
|
{
|
|
var args = new StringBuilder();
|
|
if (Startup.ProxyConnection != null)
|
|
{
|
|
args.AppendFormat("-x " + Startup.ProxyConnection + " ");
|
|
}
|
|
|
|
args.AppendFormat("--url \"{0}\" ", request.Url);
|
|
|
|
if (request.EmulateBrowser)
|
|
args.AppendFormat("-i -sS --user-agent \"{0}\" ", BrowserUtil.ChromeUserAgent);
|
|
else
|
|
args.AppendFormat("-i -sS --user-agent \"{0}\" ", "Jackett/" + configService.GetVersion());
|
|
|
|
if (!string.IsNullOrWhiteSpace(request.Cookies))
|
|
{
|
|
args.AppendFormat("--cookie \"{0}\" ", request.Cookies);
|
|
}
|
|
|
|
if (!string.IsNullOrWhiteSpace(request.Referer))
|
|
{
|
|
args.AppendFormat("--referer \"{0}\" ", request.Referer);
|
|
}
|
|
|
|
if (!string.IsNullOrEmpty(request.RawBody))
|
|
{
|
|
var postString = StringUtil.PostDataFromDict(request.PostData);
|
|
args.AppendFormat("--data \"{0}\" ", request.RawBody.Replace("\"", "\\\""));
|
|
} else if (request.PostData != null && request.PostData.Count() > 0)
|
|
{
|
|
var postString = StringUtil.PostDataFromDict(request.PostData);
|
|
args.AppendFormat("--data \"{0}\" ", postString);
|
|
}
|
|
|
|
var tempFile = Path.GetTempFileName();
|
|
args.AppendFormat("--output \"{0}\" ", tempFile);
|
|
|
|
if (Startup.DoSSLFix == true)
|
|
{
|
|
// http://stackoverflow.com/questions/31107851/how-to-fix-curl-35-cannot-communicate-securely-with-peer-no-common-encryptio
|
|
// https://git.fedorahosted.org/cgit/mod_nss.git/plain/docs/mod_nss.html
|
|
args.Append("--cipher " + SSLFix.CipherList);
|
|
}
|
|
if (Startup.IgnoreSslErrors == true)
|
|
{
|
|
args.Append("-k ");
|
|
}
|
|
args.Append("-H \"Accept-Language: en-US,en\" ");
|
|
args.Append("-H \"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8\" ");
|
|
string stdout = null;
|
|
await Task.Run(() =>
|
|
{
|
|
stdout = processService.StartProcessAndGetOutput(System.Environment.OSVersion.Platform == PlatformID.Unix ? "curl" : "curl.exe", args.ToString() , true);
|
|
});
|
|
|
|
var outputData = File.ReadAllBytes(tempFile);
|
|
File.Delete(tempFile);
|
|
stdout = Encoding.UTF8.GetString(outputData);
|
|
var result = new WebClientByteResult();
|
|
var headSplit = stdout.IndexOf("\r\n\r\n");
|
|
if (headSplit < 0)
|
|
throw new Exception("Invalid response");
|
|
var headers = stdout.Substring(0, headSplit);
|
|
if (Startup.ProxyConnection != null)
|
|
{
|
|
// the proxy provided headers too so we need to split headers again
|
|
var headSplit1 = stdout.IndexOf("\r\n\r\n",headSplit + 4);
|
|
if (headSplit1 > 0)
|
|
{
|
|
headers = stdout.Substring(headSplit + 4,headSplit1 - (headSplit + 4));
|
|
headSplit = headSplit1;
|
|
}
|
|
}
|
|
var headerCount = 0;
|
|
var cookieBuilder = new StringBuilder();
|
|
var cookies = new List<Tuple<string, string>>();
|
|
|
|
foreach (var header in headers.Split(new char[] { '\n', '\r' }, StringSplitOptions.RemoveEmptyEntries))
|
|
{
|
|
if (headerCount == 0)
|
|
{
|
|
var responseCode = int.Parse(header.Split(' ')[1]);
|
|
result.Status = (HttpStatusCode)responseCode;
|
|
}
|
|
else
|
|
{
|
|
var headerSplitIndex = header.IndexOf(':');
|
|
if (headerSplitIndex > 0)
|
|
{
|
|
var name = header.Substring(0, headerSplitIndex).ToLowerInvariant();
|
|
var value = header.Substring(headerSplitIndex + 1);
|
|
switch (name)
|
|
{
|
|
case "set-cookie":
|
|
var nameSplit = value.IndexOf('=');
|
|
if (nameSplit > -1)
|
|
{
|
|
cookies.Add(new Tuple<string, string>(value.Substring(0, nameSplit), value.Substring(0, value.IndexOf(';') + 1)));
|
|
}
|
|
break;
|
|
case "location":
|
|
result.RedirectingTo = value.Trim();
|
|
break;
|
|
case "refresh":
|
|
//"Refresh: 8;URL=/cdn-cgi/l/chk_jschl?pass=1451000679.092-1vJFUJLb9R"
|
|
var redirval = "";
|
|
var start = value.IndexOf("=");
|
|
var end = value.IndexOf(";");
|
|
var len = value.Length;
|
|
if (start > -1)
|
|
{
|
|
redirval = value.Substring(start + 1);
|
|
result.RedirectingTo = redirval;
|
|
// normally we don't want a serviceunavailable (503) to be a redirect, but that's the nature
|
|
// of this cloudflare approach..don't want to alter BaseWebResult.IsRedirect because normally
|
|
// it shoudln't include service unavailable..only if we have this redirect header.
|
|
result.Status = System.Net.HttpStatusCode.Redirect;
|
|
var redirtime = Int32.Parse(value.Substring(0, end));
|
|
System.Threading.Thread.Sleep(redirtime * 1000);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
headerCount++;
|
|
}
|
|
|
|
foreach (var cookieGroup in cookies.GroupBy(c => c.Item1))
|
|
{
|
|
cookieBuilder.AppendFormat("{0} ", cookieGroup.Last().Item2);
|
|
}
|
|
|
|
result.Cookies = cookieBuilder.ToString().Trim();
|
|
result.Content = new byte[outputData.Length - (headSplit + 3)];
|
|
var dest = 0;
|
|
for (int i = headSplit + 4; i < outputData.Length; i++)
|
|
{
|
|
result.Content[dest] = outputData[i];
|
|
dest++;
|
|
}
|
|
|
|
logger.Debug("WebClientByteResult returned " + result.Status);
|
|
ServerUtil.ResureRedirectIsFullyQualified(request, result);
|
|
return result;
|
|
}
|
|
}
|
|
}
|