CMakeLists.txt
5.14 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
cmake_minimum_required (VERSION 2.8)
project (Morfeusz)
set (Morfeusz_VERSION_MAJOR 2)
set (Morfeusz_VERSION_MINOR 0)
set (Morfeusz_VERSION_PATCH 0)
set (CMAKE_BUILD_TYPE "Debug")
enable_testing()
##### initialize some vars #####
# ARCHITECTURE
if ("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "x86_64")
set(ARCHITECTURE "amd64")
elseif ("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "x86")
set(ARCHITECTURE "i386")
elseif ("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "")
message (FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not set (should be x86 or x86_64)")
else ()
message (FATAL_ERROR "Unsupported platform: ${CMAKE_SYSTEM_PROCESSOR}")
endif ()
# PROJECT_VERSION
set (PROJECT_VERSION "${Morfeusz_VERSION_MAJOR}.${Morfeusz_VERSION_MINOR}.${Morfeusz_VERSION_PATCH}")
### USER DEFINED VARIABLES
# INPUT_DICTIONARY_CPP
set (INPUT_DICTIONARY_CPP "${CMAKE_CURRENT_BINARY_DIR}/default_fsa.cpp")
if ("${INPUT_DICTIONARY}" STREQUAL "")
if ("${EMPTY_INPUT_DICTIONARY}" STREQUAL "TRUE")
set (INPUT_DICTIONARY ${PROJECT_SOURCE_DIR}/input/empty.txt)
else ()
set (INPUT_DICTIONARY ${PROJECT_SOURCE_DIR}/input/polimorf.txt)
endif ()
endif ()
# INPUT_TAGSET
if ("${INPUT_TAGSET}" STREQUAL "")
set (INPUT_TAGSET ${PROJECT_SOURCE_DIR}/input/polimorf.tagset)
endif ()
message ("Will use ${INPUT_DICTIONARY} as default input dictionary and ${INPUT_TAGSET} as tagset")
# TARGET_DIR
if ("${TARGET_DIR}" STREQUAL "")
set (TARGET_DIR "${PROJECT_BINARY_DIR}")
endif ()
### Compilation and linking flags
if (${CMAKE_SYSTEM_NAME} MATCHES "Linux")
set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++98 -Wall -pedantic -Wcast-align -Wextra -Wmissing-noreturn -Wconversion -Wcast-qual -Wcast-align -O2")
elseif (${CMAKE_SYSTEM_NAME} MATCHES "Windows")
set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++0x -Wall -O2")
set (CMAKE_SHARED_LIBRARY_PREFIX "")
# here is some magic - must statically link libstdc++ and libgcc
# but exclude libgcc_eh.a as it causes "multiple definition of (...)" errors
set (CMAKE_SHARED_LINKER_FLAGS "-s -Os -static-libstdc++ -static-libgcc -Wl,--exclude-libs,libgcc_eh.a")
set (CMAKE_EXE_LINKER_FLAGS "-s -Os -static-libstdc++ -static-libgcc")
endif ()
########## Configure CPack ##########
# general
set (CPACK_PACKAGE_FILE_NAME "morfeusz-${PROJECT_VERSION}-${CMAKE_SYSTEM_NAME}-${ARCHITECTURE}")
set (CPACK_PACKAGE_VENDOR "Michał Lenart")
set (CPACK_PACKAGE_CONTACT "michal.lenart@ipipan.waw.pl")
set (CPACK_PACKAGE_DESCRIPTION_SUMMARY "Morphological analyzer for Polish language.")
set (CPACK_OUTPUT_FILE_PREFIX "${TARGET_DIR}")
if (${CMAKE_SYSTEM_NAME} MATCHES "Linux")
set (CPACK_GENERATOR "DEB" "STGZ" "TGZ")
#debian
set (CPACK_DEBIAN_PACKAGE_NAME "morfeusz")
set (CPACK_DEBIAN_PACKAGE_MAINTAINER "${CPACK_PACKAGE_CONTACT}")
set (CPACK_DEBIAN_PACKAGE_DEPENDS "libstdc++6 (>= 4.6)")
elseif (${CMAKE_SYSTEM_NAME} MATCHES "Windows")
if (${ARCHITECTURE} MATCHES "amd64")
set (CPACK_GENERATOR "NSIS64" "TGZ")
else ()
set (CPACK_GENERATOR "NSIS" "TGZ")
endif ()
elseif (${CMAKE_SYSTEM_NAME} MATCHES "Darwin")
set (CPACK_GENERATOR "STGZ" "TGZ")
endif ()
include (CPack)
##### END initialize some vars #####
file (COPY fsabuilder testfiles input DESTINATION .)
configure_file (
"${PROJECT_SOURCE_DIR}/morfeusz/MorfeuszConfig.hpp.in"
"${PROJECT_BINARY_DIR}/morfeusz/MorfeuszConfig.hpp"
)
###### add main sources ########
include_directories("${PROJECT_BINARY_DIR}" )
add_subdirectory (morfeusz)
add_subdirectory (fsabuilder)
########## add tests ##########
macro (test_build_and_recognize fname method)
add_test (TestBuild-${method}-${fname} python fsabuilder/buildfsa.py --analyzer -i testfiles/${fname} -o /tmp/test-${method}-${fname}.fsa --tagset-file=testfiles/polimorf.tagset --output-format=BINARY --serialization-method=${method})
add_test (TestRecognize-${method}-${fname} morfeusz/test_recognize_dict /tmp/test-${method}-${fname}.fsa testfiles/${fname})
# add_test (TestNOTRecognize-${method}-${fname} fsa/test_not_recognize /tmp/test-${method}-${fname}.fsa testfiles/out_of_dict)
# add_test (TestSpeed-${method}-${fname} fsa/test_speed /tmp/test-${method}-${fname}.fsa testfiles/speed_test_data)
endmacro ()
macro (test_result_equals inputFilename requiredOutputFilename encoding)
# add_test (TestBuild4ResultEquals-${dictFilename}-${requiredOutputFilename} python fsabuilder/fsa/buildfsa.py -i ${dictFilename} -o /tmp/test.fsa --tagset-file=testfiles/polimorf.tagset --output-format=BINARY --serialization-method=SIMPLE)
add_test (TestResultEquals-${inputFilename}-${requiredOutputFilename} morfeusz/test_result_equals ${inputFilename} ${requiredOutputFilename} ${encoding})
endmacro ()
test_build_and_recognize(PoliMorfSmall.tab SIMPLE)
test_build_and_recognize(PoliMorfSmall.tab V1)
test_build_and_recognize(PoliMorfSmall.tab V2)
test_result_equals (testfiles/test1.txt testfiles/test1.txt.out UTF8)
test_result_equals (testfiles/test1.txt.ISO8859-2 testfiles/test1.txt.out.ISO8859-2 ISO8859_2)
test_result_equals (testfiles/test1.txt.CP1250 testfiles/test1.txt.out.CP1250 CP1250)
test_result_equals (testfiles/test1.txt.CP852 testfiles/test1.txt.out.CP852 CP852)