# analyses/set_up_database/get_parlament.R

library(readr)
library(RPostgreSQL)
# General-purpose data wrangling
library(tidyverse)  
# Parsing of HTML/XML files  
library(rvest)    
# String manipulation
library(stringr)   
# Verbose regular expressions
library(rebus)     
# Eases DateTime manipulation
library(lubridate)

# # From within psql
# CREATE DATABASE twitter;
# # Now from command line:
# psql twitter

# Update the database for a set of usernames, defaulting to the members
# listed in the "Parlament de Catalunya" Google Sheet.
#
# Arguments:
#   people  Character vector of usernames. When NULL (the default), the
#           usernames are taken from the `username` column of the Google
#           Sheet, lowercased, and the sheet is cached in
#           'goog_parlament.RData' in the working directory so later runs
#           do not need to download it again.
#
# Returns:
#   Whatever vilaweb::update_database() returns.
#
# Side effects:
#   May write 'goog_parlament.RData' and create a 'data' directory in the
#   working directory.
get_parlament <- function(people = NULL) {
  cache_file <- 'goog_parlament.RData'
  sheet_url <- 'https://docs.google.com/spreadsheets/d/1DBKQi5eN9zT_Pj4J3MRiE3qLXB2VPxvd8BVdSc012Ug/edit#gid=0'

  # Parlament de Catalunya: fall back to the sheet when no usernames are given.
  if (is.null(people)) {
    if (!file.exists(cache_file)) {
      # gsheet is called through its namespace, so nothing is attached to
      # the search path and the package is only needed on a cache miss.
      goog_parlament <- gsheet::gsheet2tbl(url = sheet_url)
      save(goog_parlament, file = cache_file)
    } else {
      # load() restores `goog_parlament` into this function's environment.
      load(cache_file)
    }
    people <- tolower(goog_parlament$username)
  }

  # NOTE(review): caller-supplied `people` are passed through without
  # lowercasing, unlike the sheet-derived default -- confirm whether
  # update_database() expects lowercase usernames.
  people <- people[!is.na(people)]
  people <- sort(unique(people))

  # Make sure the 'data' directory exists before updating
  # (presumably used by update_database() -- TODO confirm).
  if (!dir.exists('data')) {
    dir.create('data')
  }

  # Duplicates are deliberately left in place here (delete_duplicates = FALSE).
  vilaweb::update_database(people = people, delete_duplicates = FALSE)
}
# Run the update with the default `people = NULL`, i.e. for the usernames
# read from the parliament Google Sheet (or its local cache).
get_parlament()
# get_parlament() calls update_database() with delete_duplicates = FALSE, so
# de-duplication is run once here afterwards.
# The path is relative and resolves against the current working directory
# (presumably analyses/set_up_database/ -- confirm before running elsewhere).
source('../../R/delete_duplicates_database.R')
# Presumably defined by the file sourced above -- verify.
delete_duplicates_database()
# joebrew/vilaweb documentation built on Sept. 11, 2020, 3:42 a.m.