HTML2Text service

This service returns a string containing the visible words from the text part of the HTML.

Input

HTML (string)

HTML text to analyze

RemoveDelimiter (boolean)

'true' to remove all delimiters from the list of words; words are separated by a space character

Output

HTML2TextResult (string)

A string that represents all visible words in the HTML

Description

This service analyzes the input HTML string and returns all visible words. The delimiters found in the source HTML can either be preserved or removed.

WSDL

WSDL: http://rainbow.vse.cz/services/HTML2TextService

A nicely formatted WSDL listing will be provided in the future. For now, only a plain listing is available.

<?xml version="1.0" encoding="utf-8"?>
<!-- WSDL description of the HTML2Text service: a single HTML2Text operation
     exposed through a SOAP binding and a plain HTTP POST binding. -->
<wsdl:definitions xmlns:wsdl="http://schemas.xmlsoap.org/wsdl/"
                  xmlns:soap="http://schemas.xmlsoap.org/wsdl/soap/"
                  xmlns:http="http://schemas.xmlsoap.org/wsdl/http/"
                  xmlns:mime="http://schemas.xmlsoap.org/wsdl/mime/"
                  xmlns:soapenc="http://schemas.xmlsoap.org/soap/encoding/"
                  xmlns:tm="http://microsoft.com/wsdl/mime/textMatching/"
                  xmlns:s="http://www.w3.org/2001/XMLSchema"
                  xmlns:tns="urn:x-rainbow:services:html2text"
                  targetNamespace="urn:x-rainbow:services:html2text">

  <!-- Schema types: the request/response wrapper elements used by the SOAP
       messages, plus the bare string element used by the HTTP POST reply. -->
  <wsdl:types>
    <s:schema targetNamespace="urn:x-rainbow:services:html2text" elementFormDefault="qualified">

      <!-- Request wrapper: HTML is optional, RemoveDelimiter is required. -->
      <s:element name="HTML2Text">
        <s:complexType>
          <s:sequence>
            <s:element name="HTML" type="s:string" minOccurs="0" maxOccurs="1" />
            <s:element name="RemoveDelimiter" type="s:boolean" minOccurs="1" maxOccurs="1" />
          </s:sequence>
        </s:complexType>
      </s:element>

      <!-- Response wrapper: carries the optional HTML2TextResult string. -->
      <s:element name="HTML2TextResponse">
        <s:complexType>
          <s:sequence>
            <s:element name="HTML2TextResult" type="s:string" minOccurs="0" maxOccurs="1" />
          </s:sequence>
        </s:complexType>
      </s:element>

      <!-- Nillable string element referenced by the HTTP POST output message. -->
      <s:element name="string" type="s:string" nillable="true" />

    </s:schema>
  </wsdl:types>

  <!-- SOAP messages: each has one "parameters" part bound to a wrapper element. -->
  <wsdl:message name="HTML2TextSoapIn">
    <wsdl:part name="parameters" element="tns:HTML2Text" />
  </wsdl:message>
  <wsdl:message name="HTML2TextSoapOut">
    <wsdl:part name="parameters" element="tns:HTML2TextResponse" />
  </wsdl:message>

  <!-- HTTP POST messages: both input parts are declared as strings here
       (including RemoveDelimiter); the reply is a single tns:string element. -->
  <wsdl:message name="HTML2TextHttpPostIn">
    <wsdl:part name="HTML" type="s:string" />
    <wsdl:part name="RemoveDelimiter" type="s:string" />
  </wsdl:message>
  <wsdl:message name="HTML2TextHttpPostOut">
    <wsdl:part name="Body" element="tns:string" />
  </wsdl:message>

  <!-- Port types: the same HTML2Text operation, once per transport. -->
  <wsdl:portType name="HTML2TextSoap">
    <wsdl:operation name="HTML2Text">
      <wsdl:documentation>This service returns string with visible words in the text part of the HTML</wsdl:documentation>
      <wsdl:input message="tns:HTML2TextSoapIn" />
      <wsdl:output message="tns:HTML2TextSoapOut" />
    </wsdl:operation>
  </wsdl:portType>
  <wsdl:portType name="HTML2TextHttpPost">
    <wsdl:operation name="HTML2Text">
      <wsdl:documentation>This service returns string with visible words in the text part of the HTML</wsdl:documentation>
      <wsdl:input message="tns:HTML2TextHttpPostIn" />
      <wsdl:output message="tns:HTML2TextHttpPostOut" />
    </wsdl:operation>
  </wsdl:portType>

  <!-- SOAP binding: document style with literal bodies, carried over HTTP. -->
  <wsdl:binding name="HTML2TextSoap" type="tns:HTML2TextSoap">
    <soap:binding style="document" transport="http://schemas.xmlsoap.org/soap/http" />
    <wsdl:operation name="HTML2Text">
      <soap:operation style="document" soapAction="urn:x-rainbow:services:html2text/HTML2Text" />
      <wsdl:input>
        <soap:body use="literal" />
      </wsdl:input>
      <wsdl:output>
        <soap:body use="literal" />
      </wsdl:output>
    </wsdl:operation>
  </wsdl:binding>

  <!-- HTTP POST binding: form-urlencoded request sent to /HTML2Text (relative
       to the port address); the "Body" part is returned as XML. -->
  <wsdl:binding name="HTML2TextHttpPost" type="tns:HTML2TextHttpPost">
    <http:binding verb="POST" />
    <wsdl:operation name="HTML2Text">
      <http:operation location="/HTML2Text" />
      <wsdl:input>
        <mime:content type="application/x-www-form-urlencoded" />
      </wsdl:input>
      <wsdl:output>
        <mime:mimeXml part="Body" />
      </wsdl:output>
    </wsdl:operation>
  </wsdl:binding>

  <!-- Service: both ports are published at the same .asmx endpoint address. -->
  <wsdl:service name="HTML2Text">
    <wsdl:documentation>Services related to SPAM classification and conversion from HTML to text</wsdl:documentation>
    <wsdl:port name="HTML2TextSoap" binding="tns:HTML2TextSoap">
      <soap:address location="http://vyuka.janmach.cz/services/html2text/html2text.asmx" />
    </wsdl:port>
    <wsdl:port name="HTML2TextHttpPost" binding="tns:HTML2TextHttpPost">
      <http:address location="http://vyuka.janmach.cz/services/html2text/html2text.asmx" />
    </wsdl:port>
  </wsdl:service>

</wsdl:definitions>