From 4eef94b1217a82eb979242dd3e06d8a4b6255e6e Mon Sep 17 00:00:00 2001 From: Hieu Hoang Date: Thu, 31 May 2012 17:24:06 +0100 Subject: move c++ code out of /script/ to / --- phrase-extract/XmlTree.h | 36 ++++++++++++++++++++++++++++++++++++ 1 file changed, 36 insertions(+) create mode 100644 phrase-extract/XmlTree.h (limited to 'phrase-extract/XmlTree.h') diff --git a/phrase-extract/XmlTree.h b/phrase-extract/XmlTree.h new file mode 100644 index 000000000..7e6bbecea --- /dev/null +++ b/phrase-extract/XmlTree.h @@ -0,0 +1,36 @@ +// $Id: XmlOption.cpp 1960 2008-12-15 12:52:38Z phkoehn $ +// vim:tabstop=2 + +/*********************************************************************** + Moses - factored phrase-based language decoder + Copyright (C) 2006 University of Edinburgh + + This library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. + + This library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. 
+ + You should have received a copy of the GNU Lesser General Public + License along with this library; if not, write to the Free Software + Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + ***********************************************************************/ + +#pragma once +#include <string> +#include <vector> +#include <set> +#include <map> +#include "SyntaxTree.h" + +std::string ParseXmlTagAttribute(const std::string& tag,const std::string& attributeName); +std::string Trim(const std::string& str, const std::string dropChars = " \t\n\r"); +std::string TrimXml(const std::string& str); +bool isXmlTag(const std::string& tag); +std::vector<std::string> TokenizeXml(const std::string& str); +bool ProcessAndStripXMLTags(std::string &line, SyntaxTree &tree, std::set< std::string > &labelCollection, std::map< std::string, int > &topLabelCollection ); +std::string unescape(const std::string &str); -- cgit v1.2.3