// Copyright (c) 2006-2009 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

// Src points to '&'.
// Skips the entity that starts at src and writes a placeholder for its value
// to dst. Returns take(src), put(dst) byte counts.
//
//   src   start of the entity; src[0] is taken to be '&' and is not inspected.
//   len   number of bytes that may be read starting at src.
//   dst   output buffer; exactly one byte (a space) is written when len > 0.
//   tlen  out: bytes consumed from src. Covers '&' through the closing ';'
//         when one is found within len; otherwise stops at the first NUL or
//         at len, whichever comes first. Never exceeds len.
//   plen  out: bytes written to dst (1, or 0 when len <= 0).
void EntityToBuffer(const char* src, int len, char* dst, int* tlen, int* plen) {
  // On Windows we do not have to do anything, browser expands HTML entities
  // for us, so text we're retrieving from it is ready for translation as it is.
  // But:
  // This is a temporary solution to let us continue the development without
  // having a real DOM text scraping in place. For now the full HTML is fed
  // to CLD for language detection and just ignoring entities is good enough
  // for testing. Later entities will be expanded by browser itself.

  // Nothing is readable: consume nothing and produce nothing.
  if (len <= 0) {
    *tlen = 0;
    *plen = 0;
    return;
  }

  // Skip entity in the source. The leading '&' always counts as consumed so
  // the caller makes forward progress; the scan never looks past len bytes.
  int taken = 1;
  while (taken < len && src[taken] != '\0' && src[taken] != ';') {
    ++taken;
  }
  // Consume the terminating ';' only if it is really there. A NUL terminator
  // or the end of the buffer is not part of the entity and is not counted.
  if (taken < len && src[taken] == ';') {
    ++taken;
  }
  *tlen = taken;

  // Report a bogus entity (space).
  *dst = ' ';
  *plen = 1;
}