-
Notifications
You must be signed in to change notification settings - Fork 0
/
umf_3_flona_amapa.R
51 lines (38 loc) · 1.82 KB
/
umf_3_flona_amapa.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
library(pdftools)
library(stringr)
library(dplyr, warn.conflicts = FALSE)
library(readr)
library(sf)
## Load the concession contract pdf and convert it to text
umf_pdf <- './data/ContratoConcesso012021_umf1_flonas_amapa.pdf'
umf_txt <- umf_pdf %>% pdf_text()
## Keep only the pages that describe UMF 3 (pages 24-25)
umf3_pages <- 24:25
cat(umf_txt[umf3_pages[2]]) # preview the text of the last UMF 3 page
umf3 <- umf_txt[umf3_pages]
cat(umf3) # print the text of both selected pages
## Vertex labels
# Print every 'P-nn' label matched in the UMF 3 pages (visual check only)
umf3 %>%
  str_extract_all('\\bP-\\d{2}+') %>%
  unlist()
# Labels P-01 ... P-32, zero-padded to two digits
vertex <- sprintf('P-%02d', 1:32)
## Regex to extract the UTM east and north coordinates
# The patterns match values written as 'E 123.456,78m' and 'N 123.456,78m'
east <- umf3 %>%
  str_extract_all('\\bE\\s\\d{3}\\.\\d{3},\\d{2}m') %>%
  unlist()
north <- umf3 %>%
  str_extract_all('\\bN\\s\\d{3}\\.\\d{3},\\d{2}m') %>%
  unlist()
# Check that the regex captured one east and one north value per vertex:
# the Length reported below should equal length(vertex).
# NOTE(review): an earlier comment here mentioned 63 vertices and a missing
# east coordinate for vertex P-42; neither matches the P-01..P-32 labels used
# in this script, so it was likely carried over from another UMF - confirm.
summary(east)
summary(north)
## Build the vertex table and save it as csv
# data.frame() silently recycles a shorter vector when the lengths divide
# evenly, so an incomplete regex match could yield wrong rows without any
# error. Fail early unless every vertex has exactly one east/north pair.
n_vertex <- length(vertex)
if (length(east) != n_vertex || length(north) != n_vertex) {
  stop(
    'Expected ', n_vertex, ' east/north coordinates but extracted ',
    length(east), ' east and ', length(north), ' north',
    call. = FALSE
  )
}

# The coordinates use '.' as grouping mark and ',' as decimal mark
utm_locale <- locale(decimal_mark = ',', grouping_mark = '.')

# Drop the trailing 'm' unit and parse the remaining text as a number
parse_utm <- function(x) {
  parse_number(gsub('m', '', x), locale = utm_locale)
}

df <- data.frame(vértice = vertex, east = east, north = north) %>%
  mutate(east = parse_utm(east), north = parse_utm(north))

# Make sure the output folder exists before writing into it
dir.create('./output', showWarnings = FALSE, recursive = TRUE)
write.csv(
  df,
  './output/vertices_umf3_flona_amapa.csv',
  row.names = FALSE,
  fileEncoding = 'UTF-8'
)
## Convert the dataframe to an sf point layer and save it as a shapefile
# Assign the CRS once, in the 'EPSG:<code>' form. The previous code passed the
# bare string '31976' and then overwrote the CRS with 'EPSG:31976' right after.
shp_points <- st_as_sf(df, coords = c('east', 'north'), crs = 'EPSG:31976')
# delete_layer = TRUE replaces a shapefile left by a previous run, so the
# script can be re-run (write.csv above already overwrites its output).
st_write(
  shp_points,
  './output/vertices_umf_3_flonas_amapa.shp',
  delete_layer = TRUE
)