blob: 597c262484e9c6c426167ba0c335682296cabe7e [file] [log] [blame]
//========================================================================
//
// This file comes from pdftohtml project
// http://pdftohtml.sourceforge.net
//
// Copyright from:
// Gueorgui Ovtcharov
// Rainer Dorsch <http://www.ra.informatik.uni-stuttgart.de/~rainer/>
// Mikhail Kruk <meshko@cs.brandeis.edu>
//
//========================================================================
//========================================================================
//
// Modified under the Poppler project - http://poppler.freedesktop.org
//
// All changes made under the Poppler project to this file are licensed
// under GPL version 2 or later
//
// Copyright (C) 2007, 2010, 2012, 2018 Albert Astals Cid <aacid@kde.org>
// Copyright (C) 2008 Boris Toloknov <tlknv@yandex.ru>
// Copyright (C) 2008 Tomas Are Haavet <tomasare@gmail.com>
// Copyright (C) 2010 OSSD CDAC Mumbai by Leena Chourey (leenac@cdacmumbai.in) and Onkar Potdar (onkar@cdacmumbai.in)
// Copyright (C) 2011 Joshua Richardson <jric@chegg.com>
// Copyright (C) 2011 Stephen Reichling <sreichling@chegg.com>
// Copyright (C) 2012 Igor Slepchin <igor.slepchin@gmail.com>
// Copyright (C) 2012 Luis Parravicini <lparravi@gmail.com>
// Copyright (C) 2013 Julien Nabet <serval2412@yahoo.fr>
// Copyright (C) 2017 Jason Crain <jason@inspiresomeone.us>
// Copyright (C) 2018 Klarälvdalens Datakonsult AB, a KDAB Group company, <info@kdab.com>. Work sponsored by the LiMux project of the city of Munich
// Copyright (C) 2018 Steven Boswell <ulatekh@yahoo.com>
// Copyright (C) 2018 Adam Reichold <adam.reichold@t-online.de>
//
// To see a description of the changes please see the Changelog file that
// came with your tarball or type make ChangeLog if you are building from git
//
//========================================================================
#include "HtmlFonts.h"
#include "HtmlUtils.h"
#include "GlobalParams.h"
#include "UnicodeMap.h"
#include "GfxFont.h"
#include <stdio.h>
namespace
{
const char* const defaultFamilyName = "Times";
const char* const styleSuffixes[] = {
"-Regular",
"-Bold",
"-BoldOblique",
"-BoldItalic",
"-Oblique",
"-Italic",
"-Roman",
};
void removeStyleSuffix(std::string& familyName) {
for (const char* const styleSuffix : styleSuffixes) {
auto pos = familyName.rfind(styleSuffix);
if (pos != std::string::npos) {
familyName.resize(pos);
return;
}
}
}
}
#define xoutRound(x) ((int)(x + 0.5))
extern bool xml;
extern bool fontFullName;
HtmlFontColor::HtmlFontColor(GfxRGB rgb){
r=static_cast<int>(rgb.r/65535.0*255.0);
g=static_cast<int>(rgb.g/65535.0*255.0);
b=static_cast<int>(rgb.b/65535.0*255.0);
if (!(Ok(r)&&Ok(b)&&Ok(g))) {
if (!globalParams->getErrQuiet()) fprintf(stderr, "Error : Bad color (%d,%d,%d) reset to (0,0,0)\n", r, g, b);
r=0;g=0;b=0;
}
}
GooString *HtmlFontColor::convtoX(unsigned int xcol) const{
GooString *xret=new GooString();
char tmp;
unsigned int k;
k = (xcol/16);
if (k<10) tmp=(char) ('0'+k); else tmp=(char)('a'+k-10);
xret->append(tmp);
k = (xcol%16);
if (k<10) tmp=(char) ('0'+k); else tmp=(char)('a'+k-10);
xret->append(tmp);
return xret;
}
GooString *HtmlFontColor::toString() const{
GooString *tmp=new GooString("#");
GooString *tmpr=convtoX(r);
GooString *tmpg=convtoX(g);
GooString *tmpb=convtoX(b);
tmp->append(tmpr);
tmp->append(tmpg);
tmp->append(tmpb);
delete tmpr;
delete tmpg;
delete tmpb;
return tmp;
}
HtmlFont::HtmlFont(GfxFont *font, int _size, GfxRGB rgb){
color=HtmlFontColor(rgb);
lineSize = -1;
size=(_size-1);
italic = false;
bold = false;
rotOrSkewed = false;
if (font->isBold() || font->getWeight() >= GfxFont::W700) bold=true;
if (font->isItalic()) italic=true;
if (const GooString *fontname = font->getName()){
FontName = new GooString(fontname);
GooString fontnameLower(fontname);
fontnameLower.lowerCase();
if (!bold && strstr(fontnameLower.c_str(),"bold")) {
bold=true;
}
if (!italic &&
(strstr(fontnameLower.c_str(),"italic")||
strstr(fontnameLower.c_str(),"oblique"))) {
italic=true;
}
familyName = fontname->c_str();
removeStyleSuffix(familyName);
} else {
FontName = new GooString(defaultFamilyName);
familyName = defaultFamilyName;
}
rotSkewMat[0] = rotSkewMat[1] = rotSkewMat[2] = rotSkewMat[3] = 0;
}
HtmlFont::HtmlFont(const HtmlFont& x){
size=x.size;
lineSize=x.lineSize;
italic=x.italic;
bold=x.bold;
familyName=x.familyName;
color=x.color;
FontName=new GooString(x.FontName);
rotOrSkewed = x.rotOrSkewed;
memcpy(rotSkewMat, x.rotSkewMat, sizeof(rotSkewMat));
}
HtmlFont::~HtmlFont(){
delete FontName;
}
HtmlFont& HtmlFont::operator=(const HtmlFont& x){
if (this==&x) return *this;
size=x.size;
lineSize=x.lineSize;
italic=x.italic;
bold=x.bold;
familyName=x.familyName;
color=x.color;
delete FontName;
FontName=new GooString(x.FontName);
return *this;
}
/*
This function is used to compare font uniquely for insertion into
the list of all encountered fonts
*/
bool HtmlFont::isEqual(const HtmlFont& x) const{
return (size==x.size) &&
(lineSize==x.lineSize) &&
(FontName->cmp(x.FontName) == 0) && (bold==x.bold) && (italic==x.italic) &&
(color.isEqual(x.getColor())) && isRotOrSkewed() == x.isRotOrSkewed() &&
(!isRotOrSkewed() || rot_matrices_equal(getRotMat(), x.getRotMat()));
}
/*
This one is used to decide whether two pieces of text can be joined together
and therefore we don't care about bold/italics properties
*/
bool HtmlFont::isEqualIgnoreBold(const HtmlFont& x) const{
return ((size==x.size) &&
(familyName == x.familyName) &&
(color.isEqual(x.getColor())));
}
GooString* HtmlFont::getFontName(){
return new GooString(familyName);
}
GooString* HtmlFont::getFullName(){
return new GooString(FontName);
}
// this method if plain wrong todo
GooString* HtmlFont::HtmlFilter(const Unicode* u, int uLen) {
GooString *tmp = new GooString();
UnicodeMap *uMap;
char buf[8];
int n;
// get the output encoding
if (!(uMap = globalParams->getTextEncoding())) {
return tmp;
}
for (int i = 0; i < uLen; ++i) {
// skip control characters. W3C disallows them and they cause a warning
// with PHP.
if (u[i] <= 31 && u[i] != '\t')
continue;
switch (u[i])
{
case '"': tmp->append("&#34;"); break;
case '&': tmp->append("&amp;"); break;
case '<': tmp->append("&lt;"); break;
case '>': tmp->append("&gt;"); break;
case ' ': case '\t': tmp->append( !xml && ( i+1 >= uLen || !tmp->getLength() || tmp->getChar( tmp->getLength()-1 ) == ' ' ) ? "&#160;" : " " );
break;
default:
{
// convert unicode to string
if ((n = uMap->mapUnicode(u[i], buf, sizeof(buf))) > 0) {
tmp->append(buf, n);
}
}
}
}
uMap->decRefCnt();
return tmp;
}
HtmlFontAccu::HtmlFontAccu(){
accu=new std::vector<HtmlFont>();
}
HtmlFontAccu::~HtmlFontAccu(){
if (accu) delete accu;
}
int HtmlFontAccu::AddFont(const HtmlFont& font){
std::vector<HtmlFont>::iterator i;
for (i=accu->begin();i!=accu->end();++i)
{
if (font.isEqual(*i))
{
return (int)(i-(accu->begin()));
}
}
accu->push_back(font);
return (accu->size()-1);
}
// get CSS font definition for font #i
GooString* HtmlFontAccu::CSStyle(int i, int j){
GooString *tmp=new GooString();
GooString *iStr=GooString::fromInt(i);
GooString *jStr=GooString::fromInt(j);
std::vector<HtmlFont>::iterator g=accu->begin();
g+=i;
HtmlFont font=*g;
GooString *Size=GooString::fromInt(font.getSize());
GooString *colorStr=font.getColor().toString();
GooString *fontName=(fontFullName ? font.getFullName() : font.getFontName());
GooString *lSize;
if(!xml){
tmp->append(".ft");
tmp->append(jStr);
tmp->append(iStr);
tmp->append("{font-size:");
tmp->append(Size);
if( font.getLineSize() != -1 && font.getLineSize() != 0 )
{
lSize = GooString::fromInt(font.getLineSize());
tmp->append("px;line-height:");
tmp->append(lSize);
delete lSize;
}
tmp->append("px;font-family:");
tmp->append(fontName); //font.getFontName());
tmp->append(";color:");
tmp->append(colorStr);
// if there is rotation or skew, include the matrix
if (font.isRotOrSkewed()) {
const double * const text_mat = font.getRotMat();
GooString matrix_str(" matrix(");
matrix_str.appendf("{0:10.10g}, {1:10.10g}, {2:10.10g}, {3:10.10g}, 0, 0)",
text_mat[0], text_mat[1], text_mat[2], text_mat[3]);
tmp->append(";-moz-transform:");
tmp->append(&matrix_str);
tmp->append(";-webkit-transform:");
tmp->append(&matrix_str);
tmp->append(";-o-transform:");
tmp->append(&matrix_str);
tmp->append(";-ms-transform:");
tmp->append(&matrix_str);
// Todo: 75% is a wild guess that seems to work pretty well;
// We probably need to calculate the real percentage
// Based on the characteristic baseline and bounding box of current font
// PDF origin is at baseline
tmp->append(";-moz-transform-origin: left 75%");
tmp->append(";-webkit-transform-origin: left 75%");
tmp->append(";-o-transform-origin: left 75%");
tmp->append(";-ms-transform-origin: left 75%");
}
tmp->append(";}");
}
if (xml) {
tmp->append("<fontspec id=\"");
tmp->append(iStr);
tmp->append("\" size=\"");
tmp->append(Size);
tmp->append("\" family=\"");
tmp->append(fontName);
tmp->append("\" color=\"");
tmp->append(colorStr);
tmp->append("\"/>");
}
delete fontName;
delete colorStr;
delete jStr;
delete iStr;
delete Size;
return tmp;
}