Skip to content

Commit

Permalink
English tokenization models
Browse files Browse the repository at this point in the history
  • Loading branch information
victorbocharov committed Jun 14, 2019
1 parent b1b6db6 commit f74a445
Show file tree
Hide file tree
Showing 5 changed files with 62 additions and 0 deletions.
15 changes: 15 additions & 0 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
cmake_minimum_required(VERSION 3.12.1)

# Top-level build description for the model package. It compiles nothing:
# it only installs pre-trained model files and packages them with CPack.
# LANGUAGES NONE stops CMake from probing for C/C++ compilers, which the
# implicit project() call would otherwise do (and warn about).
project(lima-deep-models LANGUAGES NONE)

# --- CPack configuration (must be set before include(CPack)) ---------------

# Package each install component separately, ignoring component groups
# when deciding how many packages to produce.
set(CPACK_ARCHIVE_COMPONENT_INSTALL ON)
set(CPACK_COMPONENTS_GROUPING IGNORE)
set(CPACK_DEB_COMPONENT_INSTALL ON)

# Debian package generator and its metadata.
set(CPACK_GENERATOR "DEB")
set(CPACK_DEBIAN_PACKAGE_MAINTAINER "LIMA Publisher")
set(CPACK_PACKAGE_NAME lima-deep-models)
set(CPACK_PACKAGE_VERSION "0.1.1")
set(CPACK_DEBIAN_PACKAGE_ARCHITECTURE "all")
set(CPACK_DEBIAN_FILE_NAME DEB-DEFAULT)

# Including CPack also makes cpack_add_component()/cpack_add_component_group()
# available, so it has to come before the subdirectories that call them.
include(CPack)

add_subdirectory(TensorFlowTokenizer)
5 changes: 5 additions & 0 deletions TensorFlowTokenizer/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
cmake_minimum_required(VERSION 3.12.1)

# Component group that the tokenizer model components in the
# subdirectories attach themselves to via GROUP.
cpack_add_component_group("Tokenizer")

# English (Universal Dependencies) tokenizer models.
add_subdirectory("eng.ud")
4 changes: 4 additions & 0 deletions TensorFlowTokenizer/eng.ud/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
cmake_minimum_required(VERSION 3.12.1)

# One subdirectory per English tokenizer model, processed in this order.
foreach(model_dir IN ITEMS ewt ud23-all)
  add_subdirectory("${model_dir}")
endforeach()
19 changes: 19 additions & 0 deletions TensorFlowTokenizer/eng.ud/ewt/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
cmake_minimum_required(VERSION 3.12.1)

# Install the EWT tokenizer configuration and model as their own component.
# The destination is relative on purpose: it is resolved against the install
# (or packaging) prefix, so the files land inside the staged package tree
# instead of being written to an absolute path on the build host.
install(
  FILES
    UD_English-EWT.conf
    UD_English-EWT.model
  DESTINATION
    share/apps/lima/resources/TensorFlowTokenizer/eng.ud/ewt
  COMPONENT
    tokenizer-eng.ud-ewt
)

# Describe the component to CPack and attach it to the "Tokenizer" group.
cpack_add_component(tokenizer-eng.ud-ewt
  DISPLAY_NAME
    "UD English / EWT corpus"
  GROUP
    Tokenizer
)

19 changes: 19 additions & 0 deletions TensorFlowTokenizer/eng.ud/ud23-all/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
cmake_minimum_required(VERSION 3.12.1)

# Install the "all corpora" tokenizer configuration and model as their own
# component. The destination is relative on purpose: it is resolved against
# the install (or packaging) prefix, so the files land inside the staged
# package tree instead of being written to an absolute path on the build host.
# NOTE(review): the source directory is "ud23-all" but the install directory
# is "all" - kept as in the original; confirm this is what the loader expects.
install(
  FILES
    UD_English-ALL.conf
    UD_English-ALL.model
  DESTINATION
    share/apps/lima/resources/TensorFlowTokenizer/eng.ud/all
  COMPONENT
    tokenizer-eng.ud-all
)

# Describe the component to CPack and attach it to the "Tokenizer" group.
cpack_add_component(tokenizer-eng.ud-all
  DISPLAY_NAME
    "UD English / All corpora"
  GROUP
    Tokenizer
)

0 comments on commit f74a445

Please sign in to comment.