#ifndef _RULES_H_ #define _RULES_H_ #include #include #include "chunk.h" namespace rmmseg { template void take_highest(std::vector &chunks, const Cmp &cmp) { unsigned int i = 1, j; for (j = 1; j < chunks.size(); ++j) { int rlt = cmp(chunks[j], chunks[0]); if (rlt > 0) i = 0; if (rlt >= 0) std::swap(chunks[i++], chunks[j]); } chunks.erase(chunks.begin() + i, chunks.end()); } struct MMCmp_t { int operator()(const Chunk &a, const Chunk &b) const { return a.total_length() - b.total_length(); } } MMCmp; void mm_filter(std::vector &chunks) { take_highest(chunks, MMCmp); } struct LAWLCmp_t { int operator()(const Chunk &a, const Chunk &b) const { double rlt = a.average_length() - b.average_length(); if (rlt == 0) return 0; if (rlt > 0) return 1; return -1; } } LAWLCmp; void lawl_filter(std::vector &chunks) { take_highest(chunks, LAWLCmp); } struct SVWLCmp_t { int operator()(const Chunk &a, const Chunk &b) const { double rlt = a.variance() - b.variance(); if (rlt == 0) return 0; if (rlt < 0) return 1; return -1; } } SVWLCmp; void svwl_filter(std::vector &chunks) { take_highest(chunks, SVWLCmp); } struct LSDMFOCWCmp_t { int operator()(const Chunk &a, const Chunk &b) const { return a.degree_of_morphemic_freedom() - b.degree_of_morphemic_freedom(); } } LSDMFOCWCmp; void lsdmfocw_filter(std::vector &chunks) { take_highest(chunks, LSDMFOCWCmp); } } #endif /* _RULES_H_ */