mirror of
https://github.com/AAndyProgram/SCrawler.git
synced 2026-03-14 15:52:18 +00:00
Delete old notes and comments API.Facebook: add app-id extraction from page; remove app-id from site requirements; update tokens parsing; update tokens regex API.Instagram: add default function to parse tokens
210 lines
12 KiB
VB.net
210 lines
12 KiB
VB.net
' Copyright (C) 2023 Andy https://github.com/AAndyProgram
|
|
' This program is free software: you can redistribute it and/or modify
|
|
' it under the terms of the GNU General Public License as published by
|
|
' the Free Software Foundation, either version 3 of the License, or
|
|
' (at your option) any later version.
|
|
'
|
|
' This program is distributed in the hope that it will be useful,
|
|
' but WITHOUT ANY WARRANTY
|
|
Imports SCrawler.API.Base
|
|
Imports SCrawler.Plugin
|
|
Imports SCrawler.Plugin.Attributes
|
|
Imports PersonalUtilities.Tools.Web.Clients
|
|
Imports PersonalUtilities.Tools.Web.Cookies
|
|
Imports PersonalUtilities.Functions.RegularExpressions
|
|
Imports IG = SCrawler.API.Instagram.SiteSettings
|
|
Namespace API.ThreadsNet
|
|
<Manifest("AndyProgram_ThreadsNet"), SeparatedTasks(1)>
|
|
Friend Class SiteSettings : Inherits SiteSettingsBase
|
|
#Region "Declarations"
|
|
#Region "Authorization"
|
|
<PClonable(Clone:=False)> Protected ReadOnly __HH_CSRF_TOKEN As PropertyValue
|
|
<PropertyOption(ControlText:="x-csrftoken", AllowNull:=True, IsAuth:=True), ControlNumber(0)>
|
|
Friend Overridable ReadOnly Property HH_CSRF_TOKEN As PropertyValue
|
|
Get
|
|
Return __HH_CSRF_TOKEN
|
|
End Get
|
|
End Property
|
|
<PClonable> Protected ReadOnly __HH_IG_APP_ID As PropertyValue
|
|
<PropertyOption(ControlText:="x-ig-app-id", AllowNull:=False, IsAuth:=True), ControlNumber(10)>
|
|
Friend Overridable ReadOnly Property HH_IG_APP_ID As PropertyValue
|
|
Get
|
|
Return __HH_IG_APP_ID
|
|
End Get
|
|
End Property
|
|
<PropertyOption(ControlText:="x-asbd-id", AllowNull:=True, IsAuth:=True), ControlNumber(20), PClonable>
|
|
Friend ReadOnly Property HH_ASBD_ID As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua", AllowNull:=True, IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua), ControlNumber(30), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_BROWSER As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua-full", ControlToolTip:=SettingsCLS.HEADER_DEF_sec_ch_ua_full_version_list, AllowNull:=True, IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua_full_version_list), ControlNumber(40), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_BROWSER_EXT As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua-platform-ver", ControlToolTip:=SettingsCLS.HEADER_DEF_sec_ch_ua_platform_version, AllowNull:=True, IsAuth:=True, LeftOffset:=135,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua_platform_version), ControlNumber(50), PClonable, PXML(OnlyForChecked:=True)>
|
|
Friend ReadOnly Property HH_PLATFORM_VER As PropertyValue
|
|
<PropertyOption(ControlText:="UserAgent", IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_UserAgent), ControlNumber(60), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_USER_AGENT As PropertyValue
|
|
Private Sub ChangeResponserFields(ByVal PropName As String, ByVal Value As Object)
|
|
If Not PropName.IsEmptyString Then
|
|
Dim f$ = String.Empty
|
|
Dim isUserAgent As Boolean = False
|
|
Select Case PropName
|
|
Case NameOf(HH_IG_APP_ID) : f = IG.Header_IG_APP_ID
|
|
Case NameOf(HH_ASBD_ID) : f = IG.Header_ASBD_ID
|
|
Case NameOf(HH_CSRF_TOKEN) : f = IG.Header_CSRF_TOKEN
|
|
Case NameOf(HH_BROWSER) : f = IG.Header_Browser
|
|
Case NameOf(HH_BROWSER_EXT) : f = IG.Header_BrowserExt
|
|
Case NameOf(HH_PLATFORM_VER) : f = IG.Header_Platform_Verion
|
|
Case NameOf(HH_USER_AGENT) : isUserAgent = True
|
|
End Select
|
|
If Not f.IsEmptyString Then
|
|
Responser.Headers.Remove(f)
|
|
If Not CStr(Value).IsEmptyString Then Responser.Headers.Add(f, CStr(Value))
|
|
ElseIf isUserAgent Then
|
|
Responser.UserAgent = CStr(Value)
|
|
End If
|
|
End If
|
|
End Sub
|
|
#End Region
|
|
#Region "Other properties"
|
|
<PropertyOption(ControlText:="Request timer (any)",
|
|
ControlToolTip:="The timer (in milliseconds) that SCrawler should wait before executing the next request." &
|
|
vbCr & "The default value is 1'000." & vbCr & "The minimum value is 0." & IG.TimersUrgentTip, AllowNull:=False),
|
|
PXML, PClonable>
|
|
Friend ReadOnly Property RequestsWaitTimer_Any As PropertyValue
|
|
<Provider(NameOf(RequestsWaitTimer_Any), FieldsChecker:=True)>
|
|
Private ReadOnly Property RequestsWaitTimer_AnyProvider As IFormatProvider
|
|
<PropertyOption(ControlText:="Download data",
|
|
ControlToolTip:="The internal value indicates that site data should be downloaded." & vbCr &
|
|
"It becomes unchecked when the site returns an error."), PXML>
|
|
Friend ReadOnly Property DownloadData_Impl As PropertyValue
|
|
#End Region
|
|
#End Region
|
|
#Region "Initializer"
|
|
Friend Sub New(ByVal AccName As String, ByVal Temp As Boolean)
|
|
Me.New("Threads", "threads.net", AccName, Temp, My.Resources.SiteResources.ThreadsIcon_192, My.Resources.SiteResources.ThreadsIcon_192.ToBitmap)
|
|
End Sub
|
|
Protected Sub New(ByVal SiteName As String, ByVal CookiesDomain As String, ByVal AccName As String, ByVal Temp As Boolean,
|
|
Optional ByVal __Icon As Icon = Nothing, Optional ByVal __Image As Image = Nothing)
|
|
MyBase.New(SiteName, CookiesDomain, AccName, Temp,
|
|
If(__Icon, My.Resources.SiteResources.ThreadsIcon_192),
|
|
If(__Image, My.Resources.SiteResources.ThreadsIcon_192.ToBitmap))
|
|
_AllowUserAgentUpdate = False
|
|
|
|
Dim app_id$ = String.Empty
|
|
Dim token$ = String.Empty
|
|
Dim asbd$ = String.Empty
|
|
Dim browser$ = String.Empty
|
|
Dim browserExt$ = String.Empty
|
|
Dim platform$ = String.Empty
|
|
Dim useragent$ = String.Empty
|
|
|
|
With Responser
|
|
.Accept = "*/*"
|
|
If .UserAgentExists Then useragent = .UserAgent
|
|
With .Headers
|
|
If .Count > 0 Then
|
|
token = .Value(IG.Header_CSRF_TOKEN)
|
|
app_id = .Value(IG.Header_IG_APP_ID)
|
|
asbd = .Value(IG.Header_ASBD_ID)
|
|
browser = .Value(IG.Header_Browser)
|
|
browserExt = .Value(IG.Header_BrowserExt)
|
|
platform = .Value(IG.Header_Platform_Verion)
|
|
End If
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.Authority, "www.threads.net"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.Origin, "https://www.threads.net"))
|
|
.Add("Upgrade-Insecure-Requests", 1)
|
|
.Add("Sec-Ch-Ua-Model", "")
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecChUaMobile, "?0"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecChUaPlatform, """Windows"""))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchDest, "empty"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchMode, "cors"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchSite, "same-origin"))
|
|
.Add("Sec-Fetch-User", "?1")
|
|
.Add("dht", 1)
|
|
.Add("drp", 1)
|
|
.Add(Instagram.UserData.GQL_HEADER_FB_FRINDLY_NAME, "BarcelonaProfileThreadsTabRefetchableQuery")
|
|
End With
|
|
.CookiesExtractMode = Responser.CookiesExtractModes.Any
|
|
.CookiesUpdateMode = CookieKeeper.UpdateModes.ReplaceByNameAll
|
|
.CookiesExtractedAutoSave = False
|
|
.Cookies.ChangedAllowInternalDrop = False
|
|
.Cookies.Changed = False
|
|
End With
|
|
|
|
__HH_CSRF_TOKEN = New PropertyValue(token, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_CSRF_TOKEN), v))
|
|
__HH_IG_APP_ID = New PropertyValue(app_id, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_IG_APP_ID), v))
|
|
HH_ASBD_ID = New PropertyValue(asbd, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_ASBD_ID), v))
|
|
HH_BROWSER = New PropertyValue(browser, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_BROWSER), v))
|
|
HH_BROWSER_EXT = New PropertyValue(browserExt, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_BROWSER_EXT), v))
|
|
HH_PLATFORM_VER = New PropertyValue(platform, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_PLATFORM_VER), v))
|
|
HH_USER_AGENT = New PropertyValue(useragent, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_USER_AGENT), v))
|
|
|
|
RequestsWaitTimer_Any = New PropertyValue(1000)
|
|
RequestsWaitTimer_AnyProvider = New IG.TimersChecker(0)
|
|
DownloadData_Impl = New PropertyValue(True)
|
|
|
|
UrlPatternUser = "https://www.threads.net/@{0}"
|
|
UserRegex = RParams.DMS(String.Format(UserRegexDefaultPattern, "threads.net/@"), 1)
|
|
ImageVideoContains = "threads.net"
|
|
End Sub
|
|
#End Region
|
|
#Region "UpdateResponserData"
|
|
Friend Overridable Sub UpdateResponserData(ByVal Resp As Responser)
|
|
With Responser.Cookies
|
|
Dim csrf$ = String.Empty
|
|
.Update(Resp.Cookies)
|
|
If .Changed Then
|
|
Responser.SaveCookies()
|
|
.Changed = False
|
|
csrf = If(.FirstOrDefault(Function(c) c.Name.StringToLower = IG.Header_CSRF_TOKEN_COOKIE)?.Value, String.Empty)
|
|
End If
|
|
If Not csrf.IsEmptyString AndAlso Not AEquals(Of String)(csrf, HH_CSRF_TOKEN.Value) Then HH_CSRF_TOKEN.Value = csrf : Responser.SaveSettings()
|
|
End With
|
|
End Sub
|
|
#End Region
|
|
#Region "GetInstance"
|
|
Friend Overrides Function GetInstance(ByVal What As ISiteSettings.Download) As IPluginContentProvider
|
|
Return New UserData
|
|
End Function
|
|
#End Region
|
|
#Region "BaseAuthExists, GetUserUrl, GetUserPostUrl"
|
|
Friend Overrides Function BaseAuthExists() As Boolean
|
|
Return Responser.CookiesExists And {HH_CSRF_TOKEN, HH_IG_APP_ID}.All(Function(v) ACheck(Of String)(v.Value)) And CBool(DownloadData_Impl.Value)
|
|
End Function
|
|
Friend Overrides Function GetUserUrl(ByVal User As IPluginContentProvider) As String
|
|
Return String.Format(UrlPatternUser, DirectCast(User, UserData).NameTrue)
|
|
End Function
|
|
Friend Overrides Function GetUserPostUrl(ByVal User As UserDataBase, ByVal Media As UserMedia) As String
|
|
Try
|
|
Dim code$ = DirectCast(User, UserData).GetPostCodeById(Media.Post.ID)
|
|
Dim name$ = DirectCast(User, UserData).NameTrue
|
|
If Not code.IsEmptyString Then Return $"https://www.threads.net/@{name}/post/{code}/" Else Return String.Empty
|
|
Catch ex As Exception
|
|
Return ErrorsDescriber.Execute(EDP.SendToLog, ex, "Can't open user's post", String.Empty)
|
|
End Try
|
|
End Function
|
|
#End Region
|
|
#Region "Update"
|
|
Private __Cookies As CookieKeeper = Nothing
|
|
Friend Overrides Sub BeginEdit()
|
|
__Cookies = Responser.Cookies.Copy
|
|
MyBase.BeginEdit()
|
|
End Sub
|
|
Friend Overrides Sub Update()
|
|
If _SiteEditorFormOpened And Responser.CookiesExists Then
|
|
Dim csrf$ = If(Responser.Cookies.FirstOrDefault(Function(c) c.Name.StringToLower = IG.Header_CSRF_TOKEN_COOKIE)?.Value, String.Empty)
|
|
If Not csrf.IsEmptyString Then HH_CSRF_TOKEN.Value = csrf
|
|
If Not __Cookies Is Nothing AndAlso Not __Cookies.ListEquals(Responser.Cookies) Then DownloadData_Impl.Value = True
|
|
End If
|
|
MyBase.Update()
|
|
End Sub
|
|
Friend Overrides Sub EndEdit()
|
|
__Cookies.DisposeIfReady
|
|
MyBase.EndEdit()
|
|
End Sub
|
|
#End Region
|
|
End Class
|
|
End Namespace |