You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
390 lines
14 KiB
390 lines
14 KiB
---
title: "Untitled"
output: html_document
---
|
|
|
|
```{r setup, include=FALSE}
|
|
# Set the default chunk option `echo = TRUE` for every chunk in this document.
knitr::opts_chunk$set(echo = TRUE)
|
|
```
|
|
|
|
## R Markdown
|
|
|
|
This is an R Markdown document. Markdown is a simple formatting syntax for authoring HTML, PDF, and MS Word documents. For more details on using R Markdown see <http://rmarkdown.rstudio.com>.
|
|
|
|
When you click the **Knit** button a document will be generated that includes both content as well as the output of any embedded R code chunks within the document. You can embed an R code chunk like this:
|
|
|
|
```{r cars}
|
|
# Attach dplyr before anything else so the pipelines below can use its verbs.
library(dplyr)

# Open-items table; later steps in this chunk enrich it and write it back.
oi <- fst::read.fst("./data/open_items.fst")

# Relabelling of `spread`, kept commented out for reference:
# oi %>% mutate(spread=ifelse(spread=="Only less than 5", "Only less than 5 yrs",
#                             ifelse(spread==" Only more than 5","Only more than 5 yrs",spread))) %>% fst::write.fst("./data/open_items.fst")

# Identifier table: semicolon-separated with no header row, so the columns are
# auto-named V1, V2, ...
id <- read.csv("./data/id.csv", sep = ";", header = FALSE)

# Rows whose V3 is "Identiteitsbewijs", reduced to V2 and V4.
indi <- select(filter(id, V3 == "Identiteitsbewijs"), V2, V4)

# Rows whose V3 is the Chamber of Commerce label, de-duplicated.
orgs <- unique(dplyr::filter(id, V3 == "KVK – Chamber of Commerce"))

# Remaining reference files used further down.
disorgs <- unique(read.csv("./data/diorg.csv"))
arch <- read.csv("./data/Arch.csv")
|
|
|
|
# Individuals with a recorded departure date (`Datum.Vertrek.Uit.Curacao.Nr.`):
# match the archive Id.Nummer against V4 of `indi`, expose V2 as
# business_partner, and tag the rows "Left". Year is filled with 0 here.
left.indi <- unique(indi) %>%
  inner_join(
    arch %>%
      filter(!is.na(Datum.Vertrek.Uit.Curacao.Nr.)) %>%
      mutate(
        Id.Nummer = as.character(Id.Nummer),
        e.status = "Left",
        type = "indi"
      ) %>%
      select(Id.Nummer, e.status, type),
    by = c("V4" = "Id.Nummer")
  ) %>%
  select(business_partner = V2, e.status, type) %>%
  mutate(Year = 0, .after = e.status)

# Same construction for individuals with a recorded `Datum.Overlijden.Nr.`,
# tagged "Passed".
dead.indi <- unique(indi) %>%
  inner_join(
    arch %>%
      filter(!is.na(Datum.Overlijden.Nr.)) %>%
      mutate(
        Id.Nummer = as.character(Id.Nummer),
        e.status = "Passed",
        type = "indi"
      ) %>%
      select(Id.Nummer, e.status, type),
    by = c("V4" = "Id.Nummer")
  ) %>%
  select(business_partner = V2, e.status, type) %>%
  mutate(Year = 0, .after = e.status)
|
|
|
|
# Chamber-of-commerce status list: de-duplicate, replace a missing Year by 0,
# and keep the highest-Year row(s) per business partner and status.
# The result stays grouped by (business_partner, e.status).
disc <- read.csv("./data/coc.csv") %>%
  unique() %>%
  select(-X, -Name) %>%
  mutate(Year = replace(Year, is.na(Year), 0), type = "org") %>%
  rename(business_partner = BPC, e.status = Status) %>%
  group_by(business_partner, e.status) %>%
  slice_max(order_by = Year, n = 1) %>%
  mutate(business_partner = as.character(business_partner))

# Business partners from dead.fst (column V2), all tagged "Discontinued"
# with Year 0.
dead.org <- fst::read.fst("./data/dead.fst") %>%
  select(business_partner = V2) %>%
  mutate(e.status = "Discontinued", type = "org", Year = 0)

# One row per business partner: keep the highest-Year row(s), then break any
# remaining tie by taking the last of them (largest within-group row number).
disc.org <- rbind(disc, dead.org) %>%
  group_by(business_partner) %>%
  slice_max(order_by = Year, n = 1) %>%
  mutate(count = n()) %>%
  arrange(desc(count), business_partner) %>%
  mutate(rown = row_number()) %>%
  slice_max(order_by = rown, n = 1) %>%
  ungroup() %>%
  select(-c(count, rown))
|
|
|
|
|
|
|
|
# Stack the organisation and individual status tables into one lookup.
ct <- rbind(disc.org, left.indi, dead.indi)

# Replace the stored e.status with the one from the lookup. Partners without a
# match, or whose status is "No results", are labelled "active".
oi <- oi %>%
  select(-e.status) %>%
  left_join(ct, by = "business_partner") %>%
  mutate(
    e.status = ifelse(e.status %in% c(NA, "No results"), "active", e.status)
  ) %>%
  select(-type)
|
|
|
|
|
|
|
|
|
|
|
|
dunn <- fst::read.fst("./data/dunning.fst")

# Rows carrying the latest DUNN_DATE per (business partner, contract account).
# DUNN_GPART is converted to character for the joins further down.
last.dunn <- dunn %>%
  group_by(DUNN_GPART, DUNN_VKONT) %>%
  filter(DUNN_DATE == max(DUNN_DATE)) %>%
  mutate(DUNN_GPART = as.character(DUNN_GPART))

# Dunnings without a contract account: latest date per business partner.
no.cont.dunn <- last.dunn %>%
  filter(is.na(DUNN_VKONT)) %>%
  group_by(DUNN_GPART) %>%
  filter(DUNN_DATE == max(DUNN_DATE)) %>%
  select(DUNN_GPART, DUNN_VKONT, DUNN_BILL_DOC, DUNN_ACTIVITY, DUNN_DATE) %>%
  unique() %>%
  mutate(DUNN_VKONT = as.character(DUNN_VKONT))

# Dunnings with a contract account: rows with the highest DUNN_BILL_DOC per
# account. Several dunnings can share a date, hence the unique().
cont.dunn <- last.dunn %>%
  filter(!is.na(DUNN_VKONT)) %>%
  mutate(DUNN_VKONT = as.character(DUNN_VKONT)) %>%
  group_by(DUNN_VKONT) %>%
  filter(DUNN_BILL_DOC == max(DUNN_BILL_DOC)) %>%
  select(DUNN_GPART, DUNN_VKONT, DUNN_BILL_DOC, DUNN_ACTIVITY, DUNN_DATE) %>%
  unique()

# Combine both lists and keep the latest-dated row(s) per business partner.
dunn.list.to.use <- rbind(no.cont.dunn, cont.dunn) %>%
  group_by(DUNN_GPART) %>%
  filter(DUNN_DATE == max(DUNN_DATE)) %>%
  select(DUNN_GPART, DUNN_VKONT, DUNN_DATE) %>%
  unique()

# Split again by whether a contract account is present; each half is joined
# on a different key.
dunn.list.to.use.nocont <- filter(dunn.list.to.use, is.na(DUNN_VKONT))
dunn.list.to.use.cont <- filter(dunn.list.to.use, !is.na(DUNN_VKONT))
|
|
|
|
# Attach dunning dates twice: by contract account (columns suffixed .x) and by
# business partner (suffixed .y), then derive dunn_status from the two dates:
#   - neither date present            -> "No Dunning"
#   - only one date present, and the
#     item is due after that date     -> "Dunned in Past"
#   - everything else                 -> "Dunned"
oi <- oi %>%
  left_join(dunn.list.to.use.cont, by = c("contract_account" = "DUNN_VKONT")) %>%
  left_join(dunn.list.to.use.nocont, by = c("business_partner" = "DUNN_GPART")) %>%
  mutate(
    dunn_status = case_when(
      is.na(DUNN_DATE.x) & is.na(DUNN_DATE.y) ~ "No Dunning",
      (is.na(DUNN_DATE.x) & due_date > DUNN_DATE.y) |
        (is.na(DUNN_DATE.y) & due_date > DUNN_DATE.x) ~ "Dunned in Past",
      TRUE ~ "Dunned"
    )
  ) %>%
  # Drop the helper columns brought in by the two joins.
  select(-DUNN_GPART, -DUNN_DATE.x, -DUNN_VKONT, -DUNN_DATE.y)
|
|
|
|
# Government list: first two columns only, with business_partner as character
# so it joins against `oi`.
govtnow <- read.csv("./data/govtnow.csv") |>
  dplyr::select(1:2) |>
  dplyr::mutate(business_partner = as.character(business_partner))

# Open items of partners that appear in the government list, labelled by how
# the SAP contract type compares with list membership (non-missing Name).
# Contract types other than the six handled here get NA.
noi <- oi |>
  dplyr::inner_join(govtnow, by = "business_partner") |>
  dplyr::mutate(
    govt.status = dplyr::case_when(
      !contract_type %in% c(
        "Government", "Own", "Street Light",
        "Commercial", "Residential", "Industrial"
      ) ~ NA_character_,
      contract_type == "Government" & !is.na(Name) ~ "Govt in both",
      contract_type == "Government" ~ "Govt in SAP not in list",
      !is.na(Name) ~ paste(contract_type, "in SAP govt in list"),
      TRUE ~ paste(contract_type, "in SAP not in list")
    )
  )

# file = "" makes write.csv print the CSV to the console instead of a file.
noi |>
  dplyr::select(business_partner, contract_account, contract_type, govt.status) |>
  write.csv(file = "")
|
|
# All open items, with a corrected contract type:
#   - Government and Street Light      -> "Government"
#   - Own                              -> "Own"
#   - Commercial/Residential/Industrial -> "Government" when the partner is in
#     the government list (non-missing Name), otherwise unchanged
#   - any other contract type          -> NA
oi1 <- oi |>
  dplyr::left_join(govtnow, by = "business_partner") |>
  dplyr::mutate(
    new_contract_type = dplyr::case_when(
      contract_type %in% c("Government", "Street Light") ~ "Government",
      contract_type == "Own" ~ "Own",
      !contract_type %in% c("Commercial", "Residential", "Industrial") ~ NA_character_,
      !is.na(Name) ~ "Government",
      TRUE ~ as.character(contract_type)
    )
  )
|
|
|
|
|
|
|
|
# Overwrite the open-items file with the enriched table.
# NOTE(review): this is the same file the chunk reads at its start, so
# re-running the chunk operates on already-enriched data; confirm that is
# intended.
fst::write.fst(oi1, "./data/open_items.fst")

# `noi` is deliberately NOT removed here: the next chunk filters it, and
# dropping it made that chunk fail with "object 'noi' not found".

# Print the chamber-of-commerce status table for inspection.
disc
|
|
|
|
```
|
|
|
|
|
|
```{r}
|
|
# Ad-hoc inspection: commercial contracts whose partner is in the government
# list, followed by the distinct values of the type columns.
dplyr::filter(noi, govt.status == "Commercial in SAP govt in list")
unique(oi1[["new_contract_type"]])
unique(oi[["o.type"]])
unique(oi[["contract_type"]])
|
|
# Amounts for active "Own" contracts, one row per business partner and contract
# account, with the `negative` flag spread into columns.
#
# The rename is done inline: the helper `tfrnma()` is only defined further
# down in this chunk, so calling it here failed on a fresh run. any_of()
# tolerates a missing TRUE or FALSE column. `negative == TRUE` becomes
# `credits`, `negative == FALSE` becomes `open`.
# tidyr is called with its namespace because the file never attaches it.
oi1 |>
  dplyr::filter(new_contract_type == "Own", status.x == "Only Active") |>
  dplyr::group_by(business_partner, contract_account, negative) |>
  dplyr::summarise(amount = sum(amount), .groups = "drop_last") |>
  tidyr::pivot_wider(names_from = negative, values_from = amount) |>
  dplyr::rename(dplyr::any_of(c(credits = "TRUE", open = "FALSE")))
|
|
|
|
# Rename the columns produced by pivoting on the logical `negative` flag.
#
# A column named "TRUE" becomes `credits` and a column named "FALSE" becomes
# `open`. Either column may be absent; all other columns are left untouched.
# (Previously both were renamed to `credits`, which collides as soon as both
# columns are present.)
#
# dat: a data frame, typically the result of
#      pivot_wider(names_from = negative, ...).
# Returns `dat` with the renamed columns.
tfrnma <- function(dat) {
  cols <- names(dat)
  cols[cols == "TRUE"] <- "credits"
  cols[cols == "FALSE"] <- "open"
  names(dat) <- cols
  dat
}
|
|
|
|
```
|
|
|
|
```{r}
|
|
# Show the open items whose document description is "Installments".
dplyr::filter(oi, documen_desc == "Installments")
|
|
```
|
|
|
|
|
|
```{r}
|
|
# Print the current open-items table for inspection.
oi

library(lubridate)

# Deceased individuals with the date of death parsed as a Date.
dead.indi.wt.date <- arch %>%
  filter(!is.na(Datum.Overlijden.Nr.)) %>%
  select(Id.Nummer, Datum.Overlijden.Nr.) %>%
  mutate(
    e.status = "Passed",
    type = "indi",
    Id.Nummer = as.character(Id.Nummer),
    Datum.Overlijden.Nr. = ymd(Datum.Overlijden.Nr.)
  )

# Values ymd() could not parse are patched by hand, in row order. The patch
# only makes sense for exactly two such rows; any other count would silently
# recycle the two dates, so fail loudly instead.
if (sum(is.na(dead.indi.wt.date$Datum.Overlijden.Nr.)) != 2L) {
  stop(
    "Expected exactly 2 unparseable death dates in Arch.csv, found ",
    sum(is.na(dead.indi.wt.date$Datum.Overlijden.Nr.)),
    "; review the manual date patch.",
    call. = FALSE
  )
}
dead.indi.wt.date$Datum.Overlijden.Nr.[
  is.na(dead.indi.wt.date$Datum.Overlijden.Nr.)
] <- as.Date(c("1996-01-01", "1993-07-01"))

# Match against the identity table (V4 = Id.Nummer) and expose V2 as
# business_partner. The event date is carried in the `Year` column.
dead.indi.wt.date <- indi %>%
  unique() %>%
  inner_join(dead.indi.wt.date, by = c("V4" = "Id.Nummer")) %>%
  select(business_partner = V2, e.status, Year = Datum.Overlijden.Nr., type)
|
|
|
|
|
|
# Individuals who left, with the departure date parsed as a Date.
left.indi.wt.date <- arch %>%
  filter(!is.na(Datum.Vertrek.Uit.Curacao.Nr.)) %>%
  select(Id.Nummer, Datum.Vertrek.Uit.Curacao.Nr.) %>%
  mutate(
    e.status = "Left",
    type = "indi",
    Id.Nummer = as.character(Id.Nummer),
    Datum.Vertrek.Uit.Curacao.Nr. = ymd(Datum.Vertrek.Uit.Curacao.Nr.)
  )

# Values ymd() could not parse all get the same fallback date. Assigning a
# single value works for any number of such rows; the previous three-element
# vector only fitted exactly three.
left.indi.wt.date$Datum.Vertrek.Uit.Curacao.Nr.[
  is.na(left.indi.wt.date$Datum.Vertrek.Uit.Curacao.Nr.)
] <- as.Date("2019-01-01")

# Match against the identity table (V4 = Id.Nummer) and expose V2 as
# business_partner. The event date is carried in the `Year` column.
left.indi.wt.date <- indi %>%
  unique() %>%
  inner_join(left.indi.wt.date, by = c("V4" = "Id.Nummer")) %>%
  select(business_partner = V2, e.status, Year = Datum.Vertrek.Uit.Curacao.Nr., type)
|
|
|
|
# Dated status lookup for individuals only.
ct <- rbind(left.indi.wt.date, dead.indi.wt.date)

# Re-derive e.status from the dated lookup. The joined `Year` collides with a
# `Year` already present in `oi`, so the new one arrives as Year.y and is
# renamed to date.event. date.relaxed is the event date plus 60 days, and
# rel.status compares it with the due date.
oi <- oi %>%
  select(-e.status) %>%
  left_join(ct, by = "business_partner") %>%
  mutate(
    e.status = ifelse(e.status %in% c(NA, "No results"), "active", e.status)
  ) %>%
  select(-type) %>%
  rename(date.event = Year.y) %>%
  mutate(
    date.relaxed = date.event + 60,
    rel.status = ifelse(date.relaxed > due_date, "long past", "within limit")
  )
|
|
|
|
# Persist the open items with the event-date columns.
fst::write.fst(oi, "./data/open_items.fst")

# Inspection: the organisation identifiers, and the discontinued organisations
# that match one of them on registration number.
orgs
inner_join(
  mutate(disorgs, Registration.number = as.character(Registration.number)),
  orgs,
  by = c("Registration.number" = "V4")
)
|
|
|
|
# Amounts for partners who passed away or left, per contract account, age
# bucket and dunning status, with rel.status x negative spread into columns.
#
# Two defects fixed:
#   - summarise() was not piped into pivot_wider(), so the pivot ran without
#     any data and failed.
#   - rel.status was recoded to "More than/Less than 60 days" before the pivot,
#     so the pivoted names never matched the `long past_*` / `within limit_*`
#     names the rename expects. The recode is dropped; the final column labels
#     are unchanged.
# any_of() lets the rename tolerate combinations that do not occur in the data.
oi |>
  filter(e.status %in% c("Passed", "Left")) |>
  mutate(age = ifelse(AGE_BUCKET == "5+ years", "More than 5", "Less than 5")) |>
  group_by(contract_account, rel.status, negative, age, dunn_status) |>
  summarise(amount = sum(amount), .groups = "drop") |>
  tidyr::pivot_wider(names_from = c(rel.status, negative), values_from = amount) |>
  rename(any_of(c(
    `Long Past Credit` = "long past_TRUE",
    `Within Limit Open` = "within limit_FALSE",
    `Within Limit Credit` = "within limit_TRUE",
    `Long Past Open` = "long past_FALSE"
  )))
|
|
|
|
|
|
|
|
# Rebuild the chamber-of-commerce status table (same construction as in the
# first chunk): missing Year becomes 0, highest-Year row(s) per business
# partner and status. The result stays grouped by (business_partner, e.status).
disc <- read.csv("./data/coc.csv") %>%
  unique() %>%
  select(-X, -Name) %>%
  mutate(Year = replace(Year, is.na(Year), 0), type = "org") %>%
  rename(business_partner = BPC, e.status = Status) %>%
  group_by(business_partner, e.status) %>%
  slice_max(order_by = Year, n = 1) %>%
  mutate(business_partner = as.character(business_partner))

# Business partners from dead.fst (column V2), tagged "Discontinued", Year 0.
dead.org <- fst::read.fst("./data/dead.fst") %>%
  select(business_partner = V2) %>%
  mutate(e.status = "Discontinued", type = "org", Year = 0)

# One row per business partner: highest Year first, then the last of any
# remaining ties.
disc.org <- rbind(disc, dead.org) %>%
  group_by(business_partner) %>%
  slice_max(order_by = Year, n = 1) %>%
  mutate(count = n()) %>%
  arrange(desc(count), business_partner) %>%
  mutate(rown = row_number()) %>%
  slice_max(order_by = rown, n = 1) %>%
  ungroup() %>%
  select(-c(count, rown))
|
|
|
|
# Print the current open-items table for inspection.
oi

# First source of discontinued organisations, shaped as
# (BPC, Year, Reasonunregistered, Status) so it can be stacked with do2/do3.
#
# `disc` has already lost `X` and had BPC/Status renamed to
# business_partner/e.status earlier in this chunk, so the previous
# select(-X) / select(BPC, Year, Status) failed. Use the current column names,
# and drop the grouping so select() does not re-add the group columns.
# NOTE(review): Year 0 is the placeholder for a missing year; check what ymd()
# returns for "0-01-01" and whether those rows should be NA.
do1 <- disc |>
  ungroup() |>
  mutate(Year = ymd(paste0(Year, "-01-01"))) |>
  select(BPC = business_partner, Year, Reasonunregistered = e.status) |>
  mutate(Status = "Discontinued")

# Spot check of a single business partner.
disc |> filter(business_partner == "1301003645")
|
|
|
|
```
|
|
|
|
|
|
```{r}
|
|
|
|
# Second source of discontinued organisations: inactive.csv, matched to
# business partners through the registration number (V4 of `orgs`).
# Datediscontinued is parsed as day-month-year.
do2 <- read.csv("./data/inactive.csv") |>
  select(Registration.number, Datediscontinued, Reasonunregistered) |>
  mutate(
    Registration.number = as.character(Registration.number),
    Reasonunregistered = as.character(Reasonunregistered),
    Datediscontinued = dmy(Datediscontinued)
  ) |>
  inner_join(orgs, by = c("Registration.number" = "V4")) |>
  select(BPC = V2, Year = Datediscontinued, Reasonunregistered) |>
  mutate(Status = "Discontinued")

# Spot check of a single business partner.
filter(do2, BPC == "1301003645")
|
|
|
|
```
|
|
|
|
```{r}
|
|
# Third source of discontinued organisations: `disorgs`, matched to business
# partners through the registration number (V4 of `orgs`).
# Datediscontinued is parsed as month-day-year here.
do3 <- disorgs |>
  mutate(Registration.number = as.character(Registration.number)) |>
  inner_join(orgs, by = c("Registration.number" = "V4")) |>
  mutate(Datediscontinued = mdy(Datediscontinued)) |>
  select(BPC = V2, Year = Datediscontinued, Reasonunregistered) |>
  mutate(Status = "Discontinued")

# Spot check of a single business partner.
filter(do3, BPC == "1301095174")
|
|
```
|
|
|
|
|
|
```{r}
|
|
# Stack the three discontinued-organisation sources and keep the latest-dated
# row(s): first per (BPC, Status), then, after renaming, per business partner.
# A missing reason becomes "Not Known".
# NOTE(review): `do3.1` is not defined anywhere in this document, and the join
# has no explicit `by`. Confirm where it comes from and which keys are meant.
do123 <- rbind(do1, do2, do3) |>
  group_by(BPC, Status) |>
  slice_max(order_by = Year, n = 1) |>
  unique() |>
  left_join(do3.1) |>
  mutate(
    Reasonunregistered = replace(
      Reasonunregistered, is.na(Reasonunregistered), "Not Known"
    ),
    type = "org"
  ) |>
  rename(business_partner = BPC, e.status = Status) |>
  group_by(business_partner) |>
  slice_max(order_by = Year, n = 1) |>
  unique()
|
|
|
|
|
|
|
|
```
|
|
|
|
|
|
```{r}
|
|
# Full dated status lookup: individuals (with a fixed reason text) stacked on
# top of the organisations in `do123`. Columns are selected by name in the
# order business_partner, Year, Reasonunregistered, e.status, type.
ct <- rbind(left.indi.wt.date, dead.indi.wt.date) |>
  mutate(Reasonunregistered = "Not relevant for individuals") |>
  select(business_partner, Year, Reasonunregistered, e.status, type) |>
  rbind(do123)

ct

# Rebuild the status and date columns of the open items from the full lookup.
# The columns derived earlier are dropped first so they do not collide with
# the joined ones.
n.oi <- oi %>%
  select(
    -e.status, -Year.x, -date.event, -date.relaxed, -rel.status, -Name
  ) %>%
  left_join(ct, by = "business_partner") %>%
  mutate(
    e.status = ifelse(e.status %in% c(NA, "No results"), "active", e.status)
  ) %>%
  select(-type) %>%
  rename(date.event = Year) %>%
  mutate(
    date.relaxed = date.event + 60,
    rel.status = ifelse(date.relaxed > due_date, "long past", "within limit")
  )

fst::write.fst(n.oi, "./data/open_items_new.fst")

# Inspect the distinct status and reason values that ended up in the result.
unique(n.oi[["e.status"]])
unique(n.oi[["Reasonunregistered"]])
|
|
```
|
|
|
|
|
|
|
|
```{r}
|
|
# Spot checks: three archive records by Id.Nummer, and the open items of one
# contract account.
filter(arch, Id.Nummer %in% c("1968052211", "1972090816", "1976052001"))
oi[oi[["contract_account"]] == "13090404", ]
|
|
```
|
|
|
|
```{r}
|
|
# Total amount of "Real" items flagged negative, per business partner,
# contract account, partner category and status.x.
oi |>
  filter(o.type == "Real", negative == TRUE) |>
  group_by(business_partner, contract_account, bp_category, status.x) |>
  summarize(amount = sum(amount))
|
|
```
|
|
|
|
|
|
|
|
```{r}
|
|
# Replace `amount` on every row with the total of its (o.type, negative) group.
# This is mutate(), not summarise(): all rows are kept and the result stays
# grouped.
oi |>
  ungroup() |>
  group_by(o.type, negative) |>
  mutate(amount = sum(amount))
|
|
```
|
|
|
|
|
|
|
|
## Including Plots
|
|
|
|
You can also embed plots, for example:
|
|
|
|
```{r pressure, echo=FALSE}
|
|
# Upload the open items to the Postgres database.
#
# The password is read from the PGPASSWORD environment variable instead of
# being stored in this file.
# NOTE(review): the password that used to be written here has been committed
# to version control; treat it as compromised and rotate it.
pg_password <- Sys.getenv("PGPASSWORD")
if (!nzchar(pg_password)) {
  stop(
    "Set the PGPASSWORD environment variable before running this chunk.",
    call. = FALSE
  )
}

con <- DBI::dbConnect(
  RPostgres::Postgres(),
  dbname = "postgres",
  host = "lanubiadsdbpgsql.postgres.database.azure.com",
  port = 5432,
  user = "lanubiadsdbpgsql@lanubiadsdbpgsql",
  password = pg_password,
  # Connection options are passed as named arguments rather than wrapped in
  # an unnamed list.
  sslmode = "require",
  connect_timeout = "10",
  service = NULL
)

# Always release the connection, even if listing or writing fails.
tryCatch(
  {
    print(DBI::dbListTables(con))
    DBI::dbWriteTable(con, "open_items", oi)
  },
  finally = DBI::dbDisconnect(con)
)
|
|
|
|
```
|
|
|
|
Note that the `echo = FALSE` parameter was added to the code chunk to prevent printing of the R code that generated the plot.
|
|
|