Source code for camcops_server.cc_modules.cc_convert
"""
camcops_server/cc_modules/cc_convert.py
===============================================================================
Copyright (C) 2012, University of Cambridge, Department of Psychiatry.
Created by Rudolf Cardinal (rnc1001@cam.ac.uk).
This file is part of CamCOPS.
CamCOPS is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
CamCOPS is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with CamCOPS. If not, see <https://www.gnu.org/licenses/>.
===============================================================================
**Miscellaneous conversion functions.**
"""
import logging
import re
from typing import Any, List
from cardinal_pythonlib.convert import (
base64_64format_decode,
base64_64format_encode,
hex_xformat_decode,
REGEX_BASE64_64FORMAT,
REGEX_HEX_XFORMAT,
)
from cardinal_pythonlib.logs import BraceStyleAdapter
from cardinal_pythonlib.sql.literals import (
gen_items_from_sql_csv,
SQUOTE,
sql_dequote_string,
sql_quote_string,
)
from cardinal_pythonlib.text import escape_newlines, unescape_newlines
from markupsafe import escape, Markup
log = BraceStyleAdapter(logging.getLogger(__name__))
REGEX_WHITESPACE = re.compile(r"\s")
# =============================================================================
# Conversion to/from quoted SQL values
# =============================================================================
[docs]def encode_single_value(v: Any, is_blob=False) -> str:
"""
Encodes a value for incorporation into an SQL CSV value string.
Note that this also escapes newlines. That is not necessary when receiving
data from tablets, because those data arrive in CGI forms, but necessary
for the return journey to the tablet/webclient, because those data get sent
in a one-record-one-line format.
In the C++ client, the client-side counterpart to this function is
``fromSqlLiteral()`` in ``lib/convert.cpp``.
"""
if v is None:
return "NULL"
if is_blob:
return base64_64format_encode(v)
if isinstance(v, str):
return sql_quote_string(escape_newlines(v))
# for int, float, etc.:
return str(v)
[docs]def decode_single_value(v: str) -> Any:
"""
Takes a string representing an SQL value. Returns the value. Value
types/examples:
========== ===========================================================
int ``35``, ``-12``
float ``7.23``
str ``'hello, here''s an apostrophe'``
(starts and ends with a quote)
NULL ``NULL``
(case-insensitive)
BLOB ``X'4D7953514C'``
(hex-encoded; matches MySQL method;
https://dev.mysql.com/doc/refman/5.0/en/hexadecimal-literals.html)
BLOB ``64'TXlTUUw='``
(base-64-encoded; this notation is my invention)
========== ===========================================================
But
- we use ISO-8601 text for dates/times
In the C++ client, the client-side counterpart to this function is
``toSqlLiteral()`` in ``lib/convert.cpp``.
"""
if not v:
# shouldn't happen; treat it as a NULL
return None
if v.upper() == "NULL":
return None
# special BLOB encoding here
t = REGEX_WHITESPACE.sub("", v)
# t is a copy of v with all whitespace removed. We remove whitespace in
# some cases because some base-64 encoders insert newline characters
# (e.g. Titanium iOS).
if REGEX_HEX_XFORMAT.match(t):
# log.debug("MATCHES HEX-ENCODED BLOB")
return hex_xformat_decode(t)
if REGEX_BASE64_64FORMAT.match(t):
# log.debug("MATCHES BASE64-ENCODED BLOB")
return base64_64format_decode(t)
if len(v) >= 2 and v[0] == SQUOTE and v[-1] == SQUOTE:
# v is a quoted string
s = unescape_newlines(sql_dequote_string(v))
# s is the underlying string that the source started with
# log.debug("UNDERLYING STRING: {}", s)
return s
# Not a quoted string.
# int?
try:
return int(v)
except (TypeError, ValueError):
pass
# float?
try:
return float(v)
except (TypeError, ValueError):
pass
# Who knows; something odd. Allow it as a string. "Be conservative in what
# you send, liberal in what you accept", and all that.
return v
[docs]def decode_values(valuelist: str) -> List[Any]:
"""
Takes a SQL CSV value list and returns the corresponding list of decoded
values.
"""
# log.debug("decode_values: valuelist={}", valuelist)
v = [decode_single_value(v) for v in gen_items_from_sql_csv(valuelist)]
# log.debug("decode_values: values={}", v)
return v
# =============================================================================
# Escape for HTML/XML
# =============================================================================
[docs]def br_html(text: str) -> str:
r"""
Filter that escapes text safely whilst also converting \n to <br>.
"""
# https://stackoverflow.com/questions/2285507/converting-n-to-br-in-mako-files
# https://developer.mozilla.org/en-US/docs/Web/HTML/Element/br
return escape(text).replace("\n", Markup("<br>"))