mirror of https://github.com/zulip/zulip.git
84 lines
3.1 KiB
Python
84 lines
3.1 KiB
Python
"""
|
|
String Utilities:
|
|
|
|
This module helps in converting strings from one type to another.
|
|
|
|
Currently we have strings of 3 semantic types:
|
|
|
|
1. text strings: These strings are used to represent all textual data,
|
|
like people's names, stream names, content of messages, etc.
|
|
These strings can contain non-ASCII characters, so its type should be
|
|
typing.Text (which is `str` in python 3 and `unicode` in python 2).
|
|
|
|
2. binary strings: These strings are used to represent binary data.
|
|
This should be of type `bytes`
|
|
|
|
3. native strings: These strings are for internal use only. Strings of
|
|
this type are not meant to be stored in database, displayed to end
|
|
users, etc. Things like exception names, parameter names, attribute
|
|
names, etc should be native strings. These strings should only
|
|
contain ASCII characters and they should have type `str`.
|
|
|
|
There are 3 utility functions provided for converting strings from one type
|
|
to another - force_text, force_bytes, force_str
|
|
|
|
Interconversion between text strings and binary strings can be done by
|
|
using encode and decode appropriately or by using the utility functions
|
|
force_text and force_bytes.
|
|
|
|
It is recommended to use the utility functions for other string conversions.
|
|
"""
|
|
|
|
from typing import Any, Dict, Mapping, Union, TypeVar, Text
|
|
|
|
NonBinaryStr = TypeVar('NonBinaryStr', str, Text)
|
|
# This is used to represent text or native strings
|
|
|
|
def force_text(s: Union[Text, bytes], encoding: str='utf-8') -> Text:
|
|
"""converts a string to a text string"""
|
|
if isinstance(s, Text):
|
|
return s
|
|
elif isinstance(s, bytes):
|
|
return s.decode(encoding)
|
|
else:
|
|
raise TypeError("force_text expects a string type")
|
|
|
|
def force_bytes(s: Union[Text, bytes], encoding: str='utf-8') -> bytes:
|
|
"""converts a string to binary string"""
|
|
if isinstance(s, bytes):
|
|
return s
|
|
elif isinstance(s, Text):
|
|
return s.encode(encoding)
|
|
else:
|
|
raise TypeError("force_bytes expects a string type")
|
|
|
|
def force_str(s: Union[Text, bytes], encoding: str='utf-8') -> str:
|
|
"""converts a string to a native string"""
|
|
if isinstance(s, str):
|
|
return s
|
|
elif isinstance(s, Text):
|
|
return s.encode(encoding)
|
|
elif isinstance(s, bytes):
|
|
return s.decode(encoding)
|
|
else:
|
|
raise TypeError("force_str expects a string type")
|
|
|
|
class ModelReprMixin:
|
|
"""
|
|
This mixin provides a python 2 and 3 compatible way of handling string representation of a model.
|
|
When declaring a model, inherit this mixin before django.db.models.Model.
|
|
Define __unicode__ on your model which returns a typing.Text object.
|
|
This mixin will automatically define __str__ and __repr__.
|
|
"""
|
|
|
|
def __unicode__(self) -> Text:
|
|
# Originally raised an exception, but Django (e.g. the ./manage.py shell)
|
|
# was catching the exception and not displaying any sort of error
|
|
return "Implement __unicode__ in your subclass of ModelReprMixin!"
|
|
|
|
def __str__(self) -> str:
|
|
return force_str(self.__unicode__())
|
|
|
|
def __repr__(self) -> str:
|
|
return force_str(self.__unicode__())
|