TTDL-5 Added better error handling

This commit is contained in:
Pijus Kamandulis 2020-02-25 20:12:01 +02:00
parent 1b3f985f42
commit 7a691ad32d
10 changed files with 113 additions and 41 deletions

View File

@ -2,10 +2,12 @@ package client
import ( import (
"context" "context"
"errors"
"github.com/chromedp/chromedp" "github.com/chromedp/chromedp"
"io/ioutil" "io/ioutil"
"log" "log"
"os" "os"
"strings"
"time" "time"
config "../models/config" config "../models/config"
@ -13,9 +15,11 @@ import (
) )
// GetMusicUploads - Get all uploads by given music // GetMusicUploads - Get all uploads by given music
func executeClientAction(url string, jsAction string) string { func executeClientAction(url string, jsAction string) (string, error) {
dir, err := ioutil.TempDir("", "chromedp-example") dir, err := ioutil.TempDir("", "chromedp-example")
utils.CheckErr(err) if err != nil {
return "", err
}
defer os.RemoveAll(dir) defer os.RemoveAll(dir)
opts := append(chromedp.DefaultExecAllocatorOptions[:], opts := append(chromedp.DefaultExecAllocatorOptions[:],
@ -36,15 +40,16 @@ func executeClientAction(url string, jsAction string) string {
ctx, cancel = context.WithTimeout(ctx, time.Duration(config.Config.Deadline)*time.Second) ctx, cancel = context.WithTimeout(ctx, time.Duration(config.Config.Deadline)*time.Second)
defer cancel() defer cancel()
var jsOutput string jsOutput, err := runScrapeWithInfo(ctx, jsAction, url)
jsOutput = runScrapeWithInfo(ctx, jsAction, url) if strings.HasPrefix(jsOutput, "\"ERR:") {
err = errors.New(jsOutput)
return jsOutput }
return jsOutput, err
} }
func runScrapeQuiet(ctx context.Context, jsAction string, url string) string { func runScrapeQuiet(ctx context.Context, jsAction string, url string) (string, error) {
var jsOutput string var jsOutput string
err := chromedp.Run(ctx, if err := chromedp.Run(ctx,
// Navigate to user's page // Navigate to user's page
chromedp.Navigate(url), chromedp.Navigate(url),
// Execute url grabber script // Execute url grabber script
@ -54,33 +59,40 @@ func runScrapeQuiet(ctx context.Context, jsAction string, url string) string {
chromedp.WaitVisible(`video_urls`), chromedp.WaitVisible(`video_urls`),
// Grab url links from our element // Grab url links from our element
chromedp.InnerHTML(`video_urls`, &jsOutput), chromedp.InnerHTML(`video_urls`, &jsOutput),
) ); err != nil {
utils.CheckErr(err) return "", err
return jsOutput
} }
func runScrapeWithInfo(ctx context.Context, jsAction string, url string) string { return jsOutput, nil
}
func runScrapeWithInfo(ctx context.Context, jsAction string, url string) (string, error) {
var jsOutput string var jsOutput string
err := chromedp.Run(ctx, if err := chromedp.Run(ctx,
// Navigate to user's page // Navigate to user's page
chromedp.Navigate(url), chromedp.Navigate(url),
// Execute url grabber script // Execute url grabber script
chromedp.EvaluateAsDevTools(utils.ReadFileAsString("scraper.js"), &jsOutput), chromedp.EvaluateAsDevTools(utils.ReadFileAsString("scraper.js"), &jsOutput),
chromedp.EvaluateAsDevTools(jsAction, &jsOutput), chromedp.EvaluateAsDevTools(jsAction, &jsOutput),
) ); err != nil {
utils.CheckErr(err) return "", err
}
for { for {
err = chromedp.Run(ctx, chromedp.EvaluateAsDevTools("currentState.preloadCount.toString()", &jsOutput)) if err := chromedp.Run(ctx, chromedp.EvaluateAsDevTools("currentState.preloadCount.toString()", &jsOutput)); err != nil {
utils.CheckErr(err) return "", err
}
if jsOutput != "0" { if jsOutput != "0" {
utils.Logf("\rPreloading... Currently loaded %s items.", jsOutput) utils.Logf("\rPreloading... Currently loaded %s items.", jsOutput)
} else { } else {
utils.Logf("\rPreloading...") utils.Logf("\rPreloading...")
} }
err = chromedp.Run(ctx, chromedp.EvaluateAsDevTools("currentState.finished.toString()", &jsOutput)) if err := chromedp.Run(ctx, chromedp.EvaluateAsDevTools("currentState.finished.toString()", &jsOutput)); err != nil {
utils.CheckErr(err) return "", err
}
if jsOutput == "true" { if jsOutput == "true" {
break break
} }
@ -89,13 +101,14 @@ func runScrapeWithInfo(ctx context.Context, jsAction string, url string) string
} }
utils.Log("\nRetrieving items...") utils.Log("\nRetrieving items...")
err = chromedp.Run(ctx, if err := chromedp.Run(ctx,
// Wait until custom js finishes // Wait until custom js finishes
chromedp.WaitVisible(`video_urls`), chromedp.WaitVisible(`video_urls`),
// Grab url links from our element // Grab url links from our element
chromedp.InnerHTML(`video_urls`, &jsOutput), chromedp.InnerHTML(`video_urls`, &jsOutput),
) ); err != nil {
utils.CheckErr(err) return "", err
}
return jsOutput
return jsOutput, nil
} }

View File

@ -5,7 +5,10 @@ import (
) )
// GetMusicUploads - Get all uploads by given music // GetMusicUploads - Get all uploads by given music
func GetMusicUploads(url string) []models.Upload { func GetMusicUploads(url string) ([]models.Upload, error) {
actionOutput := executeClientAction(url, "bootstrapIteratingVideos()") actionOutput, err := executeClientAction(url, "bootstrapIteratingVideos()")
return models.ParseUploads(actionOutput) if err != nil {
return nil, err
}
return models.ParseUploads(actionOutput), nil
} }

View File

@ -5,7 +5,10 @@ import (
) )
// GetUserUploads - Get all uploads by user // GetUserUploads - Get all uploads by user
func GetUserUploads(username string) []models.Upload { func GetUserUploads(username string) ([]models.Upload, error) {
actionOutput := executeClientAction(`https://www.tiktok.com/@`+username, "bootstrapIteratingVideos()") actionOutput, err := executeClientAction(`https://www.tiktok.com/@`+username, "bootstrapIteratingVideos()")
return models.ParseUploads(actionOutput) if err != nil {
return nil, err
}
return models.ParseUploads(actionOutput), nil
} }

View File

@ -5,7 +5,10 @@ import (
) )
// GetVideoDetails - returns details of video // GetVideoDetails - returns details of video
func GetVideoDetails(videoURL string) models.Upload { func GetVideoDetails(videoURL string) (models.Upload, error) {
actionOutput := executeClientAction(videoURL, "bootstrapGetCurrentVideo()") actionOutput, err := executeClientAction(videoURL, "bootstrapGetCurrentVideo()")
return models.ParseUpload(actionOutput) if err != nil {
return models.Upload{}, err
}
return models.ParseUpload(actionOutput), nil
} }

View File

@ -6,5 +6,8 @@ var ErrorCouldNotSerializeJSON = "Could not serialize json for video: %s\n"
// ErrorCouldNotRecogniseURL - // ErrorCouldNotRecogniseURL -
var ErrorCouldNotRecogniseURL = "Could not recognise URL format of string %s" var ErrorCouldNotRecogniseURL = "Could not recognise URL format of string %s"
// ErrorCouldNotGetUserUploads - Format string for reporting that fetching uploads failed; %s takes the underlying error text
var ErrorCouldNotGetUserUploads = "Failed to get user uploads: %s\n"
// ErrorPathNotFound - // ErrorPathNotFound -
var ErrorPathNotFound = "File path %s not found." var ErrorPathNotFound = "File path %s not found."

View File

@ -17,6 +17,7 @@ optStrings = {
classes: { classes: {
feedVideoItem: 'video-feed-item-wrapper', feedVideoItem: 'video-feed-item-wrapper',
modalCloseDisabled: 'disabled', modalCloseDisabled: 'disabled',
titleMessage: 'title',
}, },
tags: { tags: {
resultTag: 'video_urls', resultTag: 'video_urls',
@ -25,6 +26,11 @@ optStrings = {
attributes: { attributes: {
src: "src", src: "src",
}, },
tiktokMessages: [
"Couldn't find this account",
"No videos yet",
"Video currently unavailable",
],
}; };
currentState = { currentState = {
@ -32,12 +38,25 @@ currentState = {
finished: false, finished: false,
}; };
// checkForErrors - looks for a known TikTok error message among the page's
// title elements. When one is found it publishes "ERR: <message>" through
// createVidUrlElement and returns true; otherwise it returns false and
// leaves the page untouched.
checkForErrors = function() {
    var titles = document.getElementsByClassName(optStrings.classes.titleMessage);
    if (!titles || !titles.length) {
        return false;
    }

    // find() yields undefined when no title carries a known message, so the
    // match has to be checked before its textContent is read.
    var match = Array.from(titles).find(x => optStrings.tiktokMessages.includes(x.textContent));
    if (!match || !match.textContent) {
        return false;
    }

    createVidUrlElement("ERR: " + match.textContent);
    return true;
};
createVidUrlElement = function(outputObj) { createVidUrlElement = function(outputObj) {
var urlSetElement = document.createElement(optStrings.tags.resultTag); var urlSetElement = document.createElement(optStrings.tags.resultTag);
urlSetElement.innerText = JSON.stringify(outputObj); urlSetElement.innerText = JSON.stringify(outputObj);
document.getElementsByTagName(optStrings.tags.resultParentTag)[0].appendChild(urlSetElement); document.getElementsByTagName(optStrings.tags.resultParentTag)[0].appendChild(urlSetElement);
currentState.finished = true; currentState.finished = true;
} };
buldVidUrlArray = function(finishCallback) { buldVidUrlArray = function(finishCallback) {
var feedItem = document.getElementsByClassName(optStrings.classes.feedVideoItem)[0]; var feedItem = document.getElementsByClassName(optStrings.classes.feedVideoItem)[0];
@ -78,9 +97,10 @@ getCurrentModalVideo = function() {
link: soundHref, link: soundHref,
}, },
}; };
} };
getCurrentVideo = function() { getCurrentVideo = function() {
if(checkForErrors()) return;
var player = document.querySelector(optStrings.selectors.videoPlayer); var player = document.querySelector(optStrings.selectors.videoPlayer);
var vidUrl = player.getAttribute(optStrings.attributes.src); var vidUrl = player.getAttribute(optStrings.attributes.src);
var shareLink = document.querySelector(optStrings.selectors.videoShareInput).value; var shareLink = document.querySelector(optStrings.selectors.videoShareInput).value;
@ -100,13 +120,17 @@ getCurrentVideo = function() {
link: soundHref, link: soundHref,
}, },
}; };
} };
scrollWhileNew = function(finishCallback) { scrollWhileNew = function(finishCallback) {
var state = { count: 0 }; var state = { count: 0 };
var intervalID = window.setInterval(x => { var intervalID = window.setInterval(x => {
var oldCount = state.count; var oldCount = state.count;
state.count = document.getElementsByClassName(optStrings.classes.feedVideoItem).length; state.count = document.getElementsByClassName(optStrings.classes.feedVideoItem).length;
if(checkForErrors()) {
window.clearInterval(intervalID);
return;
}
if (oldCount !== state.count) { if (oldCount !== state.count) {
currentState.preloadCount = state.count; currentState.preloadCount = state.count;
window.scrollTo(0, document.body.scrollHeight); window.scrollTo(0, document.body.scrollHeight);
@ -130,7 +154,7 @@ bootstrapGetCurrentVideo = function() {
var video = getCurrentVideo(); var video = getCurrentVideo();
createVidUrlElement(video); createVidUrlElement(video);
return 'bootstrapGetCurrentVideo'; return 'bootstrapGetCurrentVideo';
} };
init = () => { init = () => {
const newProto = navigator.__proto__; const newProto = navigator.__proto__;

View File

@ -3,6 +3,7 @@ package utils
import ( import (
config "../models/config" config "../models/config"
"fmt" "fmt"
"os"
) )
// Log - Write to std out // Log - Write to std out
@ -23,3 +24,8 @@ func Logf(format string, a ...interface{}) {
func LogFatal(format string, a ...interface{}) { func LogFatal(format string, a ...interface{}) {
panic(fmt.Sprintf(format, a...)) panic(fmt.Sprintf(format, a...))
} }
// LogErr - Format the message and write it to standard error
func LogErr(format string, a ...interface{}) {
	message := fmt.Sprintf(format, a...)
	fmt.Fprint(os.Stderr, message)
}

View File

@ -3,6 +3,7 @@ package workflows
import ( import (
client "../client" client "../client"
config "../models/config" config "../models/config"
res "../resources"
utils "../utils" utils "../utils"
"fmt" "fmt"
"regexp" "regexp"
@ -16,7 +17,11 @@ func CanUseDownloadMusic(url string) bool {
// DownloadMusic - Download all videos by given music // DownloadMusic - Download all videos by given music
func DownloadMusic(url string) { func DownloadMusic(url string) {
uploads := client.GetMusicUploads(url) uploads, err := client.GetMusicUploads(url)
if err != nil {
utils.LogErr(res.ErrorCouldNotGetUserUploads, err.Error())
return
}
uploadCount := len(uploads) uploadCount := len(uploads)
for index, upload := range uploads { for index, upload := range uploads {

View File

@ -3,20 +3,27 @@ package workflows
import ( import (
client "../client" client "../client"
config "../models/config" config "../models/config"
res "../resources"
utils "../utils" utils "../utils"
"fmt" "fmt"
"regexp"
"strings" "strings"
) )
// CanUseDownloadUser - Test's if this workflow can be used for parameter // CanUseDownloadUser - Test's if this workflow can be used for parameter
func CanUseDownloadUser(url string) bool { func CanUseDownloadUser(url string) bool {
match := strings.Contains(url, "/") isURL := strings.Contains(url, "/")
return !match match, _ := regexp.MatchString(".+com\\/@[^\\/]+", url)
return !isURL || match
} }
// DownloadUser - Download all user's videos // DownloadUser - Download all user's videos
func DownloadUser(username string) { func DownloadUser(username string) {
uploads := client.GetUserUploads(username) uploads, err := client.GetUserUploads(username)
if err != nil {
utils.LogErr(res.ErrorCouldNotGetUserUploads, err.Error())
return
}
uploadCount := len(uploads) uploadCount := len(uploads)
downloadDir := fmt.Sprintf("%s/%s", config.Config.OutputPath, username) downloadDir := fmt.Sprintf("%s/%s", config.Config.OutputPath, username)

View File

@ -4,6 +4,7 @@ import (
client "../client" client "../client"
models "../models" models "../models"
config "../models/config" config "../models/config"
res "../resources"
utils "../utils" utils "../utils"
"fmt" "fmt"
"regexp" "regexp"
@ -18,7 +19,11 @@ func CanUseDownloadSingleVideo(url string) bool {
// DownloadSingleVideo - Downloads single video // DownloadSingleVideo - Downloads single video
func DownloadSingleVideo(url string) { func DownloadSingleVideo(url string) {
username := utils.GetUsernameFromString(url) username := utils.GetUsernameFromString(url)
upload := client.GetVideoDetails(url) upload, err := client.GetVideoDetails(url)
if err != nil {
utils.LogErr(res.ErrorCouldNotGetUserUploads, err.Error())
return
}
downloadDir := fmt.Sprintf("%s/%s", config.Config.OutputPath, username) downloadDir := fmt.Sprintf("%s/%s", config.Config.OutputPath, username)
utils.InitOutputDirectory(downloadDir) utils.InitOutputDirectory(downloadDir)