language.py 1.4 KB

123456789101112131415161718192021222324252627282930313233343536373839
  1. #!/usr/bin/env python
  2. # encoding: utf-8
  3. # Licensed to the Apache Software Foundation (ASF) under one or more
  4. # contributor license agreements. See the NOTICE file distributed with
  5. # this work for additional information regarding copyright ownership.
  6. # The ASF licenses this file to You under the Apache License, Version 2.0
  7. # (the "License"); you may not use this file except in compliance with
  8. # the License. You may obtain a copy of the License at
  9. #
  10. # http://www.apache.org/licenses/LICENSE-2.0
  11. #
  12. # Unless required by applicable law or agreed to in writing, software
  13. # distributed under the License is distributed on an "AS IS" BASIS,
  14. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. # See the License for the specific language governing permissions and
  16. # limitations under the License.
  17. #
  18. from .tika import detectLang1, callServer, ServerEndpoint
  19. def from_file(filename):
  20. '''
  21. Detects language of the file
  22. :param filename: path to file whose language needs to be detected
  23. :return:
  24. '''
  25. jsonOutput = detectLang1('file', filename)
  26. return jsonOutput[1]
  27. def from_buffer(string):
  28. '''
  29. Detects language of content in the buffer
  30. :param string: buffered data
  31. :return:
  32. '''
  33. status, response = callServer('put', ServerEndpoint, '/language/string', string,
  34. {'Accept': 'text/plain'}, False)
  35. return response