mirror of
https://github.com/AAndyProgram/SCrawler.git
synced 2026-03-14 15:52:18 +00:00
YT MusicPlaylistsForm, VideoOptionsForm: add audio bitrate option MediaItem: update type icon; update confirmation dialog for deleting non-single object Track: update extension PlayList: update 'ToString' information for 'MediaItem' YouTubeMediaContainerBase: add size recalculation; add audio bitrate change; embed thumbnail in the extracted 'mp3' as cover art; update 'DownloadCommand' function; include elements' files in XML for non-single items; update 'Delete' function; update files handling; include generated playlists and cover file in the file list YouTubeSettings: add properties 'DefaultAudioEmbedThumbnail_ExtractedFiles', 'DefaultAudioBitrate', 'DefaultAudioBitrate_crf' Exclude 'drc' from parsing results Fix incorrect file reference when the yt-dlp.exe has a different name SCrawler Base.Declarations: hide 'TokenRefreshIntervalProvider' error Base.DeclaredNames: remove 'Header_FB_FRIENDLY_NAME' const (use 'API.Instagram.UserData.GQL') Base.M3U8Base: add 'SkipBroken' argument Base.UserDataBase: add size recalculation (STD) Base.SiteSettingsBase: add 'SettingsVersion' property TDownloader: delete 'RenameOldFileNames' function SiteEditorForm: remove begin/end update of global settings when updating MainFrame: update 'BTT_DOWN_SPEC' tooltip SettingsHostCollection, SettingsHost: move site settings to a personal setting file (delete these settings from the global settings file) DownloadGroupCollection: remove data update during initialization and reindexing SettingsCLS: add 'SettingsVersion' property Add hidden controls API.JustForFans: change m3u8 parsing and downloading algo; remove 'CancellationToken' from m3u8 (replace with 'IThrower') API.Facebook: add option 'RequestsWaitTimer_Any'; add internal option 'DownloadData_Impl'; update GDL names and tokens references; add wait timers API.Threads: add option 'RequestsWaitTimer_Any'; add internal option 'DownloadData_Impl'; update GDL names and tokens references; add wait timers API.Instagram: ADD 'GDL' SUPPORT; add 'UpdateWwwClaim' to 'Declarations.UpdateResponser' and 'UserData'; add additional 'HH_IG_WWW_CLAIM' properties; add 'RequestsWaitTimer_Any' property; add tooltips for timer controls; update 'LastRequests' environment; update information about requests on the label in the settings form; update reels downloading function
210 lines
12 KiB
VB.net
210 lines
12 KiB
VB.net
' Copyright (C) 2023 Andy https://github.com/AAndyProgram
|
|
' This program is free software: you can redistribute it and/or modify
|
|
' it under the terms of the GNU General Public License as published by
|
|
' the Free Software Foundation, either version 3 of the License, or
|
|
' (at your option) any later version.
|
|
'
|
|
' This program is distributed in the hope that it will be useful,
|
|
' but WITHOUT ANY WARRANTY
|
|
Imports SCrawler.API.Base
|
|
Imports SCrawler.Plugin
|
|
Imports SCrawler.Plugin.Attributes
|
|
Imports PersonalUtilities.Tools.Web.Clients
|
|
Imports PersonalUtilities.Tools.Web.Cookies
|
|
Imports PersonalUtilities.Functions.RegularExpressions
|
|
Imports IG = SCrawler.API.Instagram.SiteSettings
|
|
Namespace API.ThreadsNet
|
|
<Manifest("AndyProgram_ThreadsNet"), SeparatedTasks(1)>
|
|
Friend Class SiteSettings : Inherits SiteSettingsBase
|
|
#Region "Declarations"
|
|
#Region "Authorization"
|
|
<PClonable(Clone:=False)> Protected ReadOnly __HH_CSRF_TOKEN As PropertyValue
|
|
<PropertyOption(ControlText:="x-csrftoken", AllowNull:=True, IsAuth:=True), ControlNumber(0)>
|
|
Friend Overridable ReadOnly Property HH_CSRF_TOKEN As PropertyValue
|
|
Get
|
|
Return __HH_CSRF_TOKEN
|
|
End Get
|
|
End Property
|
|
<PClonable> Protected ReadOnly __HH_IG_APP_ID As PropertyValue
|
|
<PropertyOption(ControlText:="x-ig-app-id", AllowNull:=False, IsAuth:=True), ControlNumber(10)>
|
|
Friend Overridable ReadOnly Property HH_IG_APP_ID As PropertyValue
|
|
Get
|
|
Return __HH_IG_APP_ID
|
|
End Get
|
|
End Property
|
|
<PropertyOption(ControlText:="x-asbd-id", AllowNull:=True, IsAuth:=True), ControlNumber(20), PClonable>
|
|
Friend ReadOnly Property HH_ASBD_ID As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua", AllowNull:=True, IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua), ControlNumber(30), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_BROWSER As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua-full", ControlToolTip:=SettingsCLS.HEADER_DEF_sec_ch_ua_full_version_list, AllowNull:=True, IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua_full_version_list), ControlNumber(40), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_BROWSER_EXT As PropertyValue
|
|
<PropertyOption(ControlText:="sec-ch-ua-platform-ver", ControlToolTip:=SettingsCLS.HEADER_DEF_sec_ch_ua_platform_version, AllowNull:=True, IsAuth:=True, LeftOffset:=135,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_sec_ch_ua_platform_version), ControlNumber(50), PClonable, PXML(OnlyForChecked:=True)>
|
|
Friend ReadOnly Property HH_PLATFORM_VER As PropertyValue
|
|
<PropertyOption(ControlText:="UserAgent", IsAuth:=True,
|
|
InheritanceName:=SettingsCLS.HEADER_DEF_UserAgent), ControlNumber(60), PClonable, PXML(OnlyForChecked:=True)>
|
|
Private ReadOnly Property HH_USER_AGENT As PropertyValue
|
|
Private Sub ChangeResponserFields(ByVal PropName As String, ByVal Value As Object)
|
|
If Not PropName.IsEmptyString Then
|
|
Dim f$ = String.Empty
|
|
Dim isUserAgent As Boolean = False
|
|
Select Case PropName
|
|
Case NameOf(HH_IG_APP_ID) : f = IG.Header_IG_APP_ID
|
|
Case NameOf(HH_ASBD_ID) : f = IG.Header_ASBD_ID
|
|
Case NameOf(HH_CSRF_TOKEN) : f = IG.Header_CSRF_TOKEN
|
|
Case NameOf(HH_BROWSER) : f = IG.Header_Browser
|
|
Case NameOf(HH_BROWSER_EXT) : f = IG.Header_BrowserExt
|
|
Case NameOf(HH_PLATFORM_VER) : f = IG.Header_Platform_Verion
|
|
Case NameOf(HH_USER_AGENT) : isUserAgent = True
|
|
End Select
|
|
If Not f.IsEmptyString Then
|
|
Responser.Headers.Remove(f)
|
|
If Not CStr(Value).IsEmptyString Then Responser.Headers.Add(f, CStr(Value))
|
|
ElseIf isUserAgent Then
|
|
Responser.UserAgent = CStr(Value)
|
|
End If
|
|
End If
|
|
End Sub
|
|
#End Region
|
|
#Region "Other properties"
|
|
<PropertyOption(ControlText:="Request timer (any)",
|
|
ControlToolTip:="The timer (in milliseconds) that SCrawler should wait before executing the next request." &
|
|
vbCr & "The default value is 1'000." & vbCr & "The minimum value is 0." & IG.TimersUrgentTip, AllowNull:=False),
|
|
PXML, PClonable>
|
|
Friend ReadOnly Property RequestsWaitTimer_Any As PropertyValue
|
|
<Provider(NameOf(RequestsWaitTimer_Any), FieldsChecker:=True)>
|
|
Private ReadOnly Property RequestsWaitTimer_AnyProvider As IFormatProvider
|
|
<PropertyOption(ControlText:="Download data",
|
|
ControlToolTip:="The internal value indicates that site data should be downloaded." & vbCr &
|
|
"It becomes unchecked when the site returns an error."), PXML>
|
|
Friend ReadOnly Property DownloadData_Impl As PropertyValue
|
|
#End Region
|
|
#End Region
|
|
#Region "Initializer"
|
|
Friend Sub New(ByVal AccName As String, ByVal Temp As Boolean)
|
|
Me.New("Threads", "threads.net", AccName, Temp, My.Resources.SiteResources.ThreadsIcon_192, My.Resources.SiteResources.ThreadsIcon_192.ToBitmap)
|
|
End Sub
|
|
Protected Sub New(ByVal SiteName As String, ByVal CookiesDomain As String, ByVal AccName As String, ByVal Temp As Boolean,
|
|
Optional ByVal __Icon As Icon = Nothing, Optional ByVal __Image As Image = Nothing)
|
|
MyBase.New(SiteName, CookiesDomain, AccName, Temp,
|
|
If(__Icon, My.Resources.SiteResources.ThreadsIcon_192),
|
|
If(__Image, My.Resources.SiteResources.ThreadsIcon_192.ToBitmap))
|
|
_AllowUserAgentUpdate = False
|
|
|
|
Dim app_id$ = String.Empty
|
|
Dim token$ = String.Empty
|
|
Dim asbd$ = String.Empty
|
|
Dim browser$ = String.Empty
|
|
Dim browserExt$ = String.Empty
|
|
Dim platform$ = String.Empty
|
|
Dim useragent$ = String.Empty
|
|
|
|
With Responser
|
|
.Accept = "*/*"
|
|
'URGENT: remove after debug
|
|
.DeclaredError = EDP.SendToLog + EDP.ThrowException
|
|
If .UserAgentExists Then useragent = .UserAgent
|
|
With .Headers
|
|
If .Count > 0 Then
|
|
token = .Value(IG.Header_CSRF_TOKEN)
|
|
app_id = .Value(IG.Header_IG_APP_ID)
|
|
asbd = .Value(IG.Header_ASBD_ID)
|
|
browser = .Value(IG.Header_Browser)
|
|
browserExt = .Value(IG.Header_BrowserExt)
|
|
platform = .Value(IG.Header_Platform_Verion)
|
|
End If
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.Authority, "www.threads.net"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.Origin, "https://www.threads.net"))
|
|
.Add("Upgrade-Insecure-Requests", 1)
|
|
.Add("Sec-Ch-Ua-Model", "")
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecChUaMobile, "?0"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecChUaPlatform, """Windows"""))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchDest, "empty"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchMode, "cors"))
|
|
.Add(HttpHeaderCollection.GetSpecialHeader(MyHeaderTypes.SecFetchSite, "same-origin"))
|
|
.Add("Sec-Fetch-User", "?1")
|
|
.Add(Instagram.UserData.GQL_HEADER_FB_FRINDLY_NAME, "BarcelonaProfileThreadsTabRefetchableQuery")
|
|
End With
|
|
.CookiesExtractMode = Responser.CookiesExtractModes.Any
|
|
.CookiesUpdateMode = CookieKeeper.UpdateModes.ReplaceByNameAll
|
|
.CookiesExtractedAutoSave = False
|
|
.Cookies.ChangedAllowInternalDrop = False
|
|
.Cookies.Changed = False
|
|
End With
|
|
|
|
__HH_CSRF_TOKEN = New PropertyValue(token, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_CSRF_TOKEN), v))
|
|
__HH_IG_APP_ID = New PropertyValue(app_id, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_IG_APP_ID), v))
|
|
HH_ASBD_ID = New PropertyValue(asbd, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_ASBD_ID), v))
|
|
HH_BROWSER = New PropertyValue(browser, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_BROWSER), v))
|
|
HH_BROWSER_EXT = New PropertyValue(browserExt, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_BROWSER_EXT), v))
|
|
HH_PLATFORM_VER = New PropertyValue(platform, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_PLATFORM_VER), v))
|
|
HH_USER_AGENT = New PropertyValue(useragent, GetType(String), Sub(v) ChangeResponserFields(NameOf(HH_USER_AGENT), v))
|
|
|
|
RequestsWaitTimer_Any = New PropertyValue(1000)
|
|
RequestsWaitTimer_AnyProvider = New IG.TimersChecker(0)
|
|
DownloadData_Impl = New PropertyValue(True)
|
|
|
|
UrlPatternUser = "https://www.threads.net/@{0}"
|
|
UserRegex = RParams.DMS(String.Format(UserRegexDefaultPattern, "threads.net/@"), 1)
|
|
ImageVideoContains = "threads.net"
|
|
End Sub
|
|
#End Region
|
|
#Region "UpdateResponserData"
|
|
Friend Overridable Sub UpdateResponserData(ByVal Resp As Responser)
|
|
With Responser.Cookies
|
|
Dim csrf$ = String.Empty
|
|
.Update(Resp.Cookies)
|
|
If .Changed Then
|
|
Responser.SaveCookies()
|
|
.Changed = False
|
|
csrf = If(.FirstOrDefault(Function(c) c.Name.StringToLower = IG.Header_CSRF_TOKEN_COOKIE)?.Value, String.Empty)
|
|
End If
|
|
If Not csrf.IsEmptyString AndAlso Not AEquals(Of String)(csrf, HH_CSRF_TOKEN.Value) Then HH_CSRF_TOKEN.Value = csrf : Responser.SaveSettings()
|
|
End With
|
|
End Sub
|
|
#End Region
|
|
#Region "GetInstance"
|
|
Friend Overrides Function GetInstance(ByVal What As ISiteSettings.Download) As IPluginContentProvider
|
|
Return New UserData
|
|
End Function
|
|
#End Region
|
|
#Region "BaseAuthExists, GetUserUrl, GetUserPostUrl"
|
|
Friend Overrides Function BaseAuthExists() As Boolean
|
|
Return Responser.CookiesExists And {HH_CSRF_TOKEN, HH_IG_APP_ID}.All(Function(v) ACheck(Of String)(v.Value)) And CBool(DownloadData_Impl.Value)
|
|
End Function
|
|
Friend Overrides Function GetUserUrl(ByVal User As IPluginContentProvider) As String
|
|
Return String.Format(UrlPatternUser, DirectCast(User, UserData).NameTrue)
|
|
End Function
|
|
Friend Overrides Function GetUserPostUrl(ByVal User As UserDataBase, ByVal Media As UserMedia) As String
|
|
Try
|
|
Dim code$ = DirectCast(User, UserData).GetPostCodeById(Media.Post.ID)
|
|
Dim name$ = DirectCast(User, UserData).NameTrue
|
|
If Not code.IsEmptyString Then Return $"https://www.threads.net/@{name}/post/{code}/" Else Return String.Empty
|
|
Catch ex As Exception
|
|
Return ErrorsDescriber.Execute(EDP.SendToLog, ex, "Can't open user's post", String.Empty)
|
|
End Try
|
|
End Function
|
|
#End Region
|
|
#Region "Update"
|
|
Private __Cookies As CookieKeeper = Nothing
|
|
Friend Overrides Sub BeginEdit()
|
|
__Cookies = Responser.Cookies.Copy
|
|
MyBase.BeginEdit()
|
|
End Sub
|
|
Friend Overrides Sub Update()
|
|
If _SiteEditorFormOpened And Responser.CookiesExists Then
|
|
Dim csrf$ = If(Responser.Cookies.FirstOrDefault(Function(c) c.Name.StringToLower = IG.Header_CSRF_TOKEN_COOKIE)?.Value, String.Empty)
|
|
If Not csrf.IsEmptyString Then HH_CSRF_TOKEN.Value = csrf
|
|
If Not __Cookies Is Nothing AndAlso Not __Cookies.ListEquals(Responser.Cookies) Then DownloadData_Impl.Value = True
|
|
End If
|
|
MyBase.Update()
|
|
End Sub
|
|
Friend Overrides Sub EndEdit()
|
|
__Cookies.DisposeIfReady
|
|
MyBase.EndEdit()
|
|
End Sub
|
|
#End Region
|
|
End Class
|
|
End Namespace |