diff options
author | rafa_99 <raroma09@gmail.com> | 2021-08-30 14:38:01 +0100 |
---|---|---|
committer | rafa_99 <raroma09@gmail.com> | 2021-08-30 14:38:01 +0100 |
commit | b731bcbf8eada98e647b3d7a5944f65cba78edb7 (patch) | |
tree | cf8e0ce5f4c52e46e971acbd4857c2ca038b83df /utils.c |
Initial development of queryt files
Diffstat (limited to 'utils.c')
-rw-r--r-- | utils.c | 196 |
1 files changed, 196 insertions, 0 deletions
@@ -0,0 +1,196 @@ +#include <stdio.h> +#include <stdlib.h> +#include <string.h> +#include "utils.h" +#include "libs/curl.h" +#include "libs/string.h" + +int tokenCount(char *string, char *delimiter) +{ + int totalCount = 0; + + if (string != NULL && delimiter != NULL) + { + char *auxString = (char *)calloc(strlen(string) + 1, sizeof(char)); + strcpy(auxString, string); + + char *token = strtok(auxString, delimiter); + + while (token != NULL) + { + totalCount++; + token = strtok(NULL, delimiter); + } + + free(auxString); + } + + return totalCount; +} + +char **tokenizer(char *string, char *delimiter) +{ + char **tokens = NULL; + + if (string != NULL && delimiter != NULL) + { + char *auxString = (char *)calloc(strlen(string) + 1, sizeof(char)); + strcpy(auxString, string); + + tokens = (char **)calloc(tokenCount(auxString, delimiter), sizeof(char *)); + char *tempToken = strtok(auxString, delimiter); + + for (int i = 0; tempToken != NULL; i++) + { + tokens[i] = (char *)calloc(strlen(tempToken) + 1, sizeof(char)); + strcpy(tokens[i], tempToken); + tempToken = strtok(NULL, delimiter); + } + + free(auxString); + } + else + { + tokens = (char **)calloc(1, sizeof(char)); + } + + return tokens; +} + +void freeTokens(char **tokens, int size) +{ + if ( size > 0 ) + { + for ( int i = 0; i < size; i++ ) + { + free(tokens[i]); + } + } + free(tokens); +} + +char *queryNormalizer(char *query) +{ + char *norm = NULL; + if (query != NULL && strlen(query) > 0) + { + // Declaring Initial Query Size + int querySize = strlen(query); + + // Calculating Normalized Query Size Allocation + for (int i = 0; i < strlen(query); i++) + { + if (query[i] == '+' || query[i] == '#' || query[i] == '&') + { + querySize += 2; + } + } + + // Allocating Memory + norm = (char *)calloc(querySize + 1, sizeof(char)); + + // Creating New Normalized Query + for (int i = 0, added = 0; i < strlen(query); i++) + { + switch (query[i]) + { + case '+': + /* fall through */ + case '#': + /* fall through */ + case '&': + for (int j = 0; j < 3; j++) + { + switch (j) + { + case 0: + norm[i + j + added] = '%'; + break; + case 1: + norm[i + j + added] = '2'; + break; + case 2: + switch (query[i]) + { + case '+': + norm[i + j + added] = 'B'; + break; + case '#': + norm[i + j + added] = '3'; + break; + case '&': + norm[i + j + added] = '6'; + } + } + } + added += 2; + break; + case ' ': + norm[i + added] = '+'; + break; + default: + norm[i + added] = query[i]; + } + } + } + return norm; +} + +int* jsonDataLimits(int tokenCount, char **tokens, char *topDelimiter, char *bottomDelimiter) +{ + int *limits = (int *) calloc(2, sizeof(int)); + + for (int i = 0; i < tokenCount + 1 && (limits[0] == 0 || limits[1] == 0); i++) + { + if (tokens[i] != NULL && strcmp(tokens[i], topDelimiter) == 0 && strcmp(tokens[i + 1], "=") == 0) + { + limits[0] = i + 2; + } + else if (tokens[i] != NULL && limits[1] == 0 && limits[0] > 0 && strstr(tokens[i], bottomDelimiter) != NULL) + { + limits[1] = i; + } + } + + return limits; +} + +char *curlToJSON(char *url) +{ + char *json = NULL; + + if (url != NULL && strlen(url) > 0) + { + // Setting Up Vars + char jsonVar[] = "ytInitialData", unneededHtml[] = ";</script><script", *htmlPage = downloadPage(url), **tokens = tokenizer(htmlPage, " "); + int numberOfTokens = tokenCount(htmlPage, " "), *limits = jsonDataLimits(numberOfTokens, tokens, jsonVar, unneededHtml); + json = (char *)calloc(1, sizeof(char)); + + // Pre Clearing Unused Memory + free(htmlPage); + + // Creating the JSON String + for (int i = limits[0]; i <= limits[1]; i++) + { + if (i < limits[1]) + { + json = realloc(json, (strlen(json) + strlen(tokens[i]) + 2)); + strcat(json, tokens[i]); + strcat(json, " "); + } + else + { + // Last byte doesn't need a extra space + json = realloc(json, (strlen(json) + strlen(tokens[i]) + 1)); + strcat(json, tokens[i]); + } + } + + json[strlen(json) - strlen(unneededHtml)] = '\0'; + + freeTokens(tokens, numberOfTokens); + free(limits); + } + + return json; +} |