from __future__ import annotations import typing as t import torch import transformers from transformers.utils import is_tf_available from transformers.utils import is_torch_available from transformers.pipelines import PIPELINE_REGISTRY from transformers.pipelines import TextClassificationPipeline if t.TYPE_CHECKING: from transformers.pipelines.base import GenericTensor MAX_LENGTH = 3000 text = """\ The three words that best describe Hunter Schafer's Vanity Fair Oscars party look? Less is more. Dressed in a bias-cut white silk skirt, a single ivory-colored feather and — crucially — nothing else, Schafer was bound to raise a few eyebrows. Google searches for the actor and model skyrocketed on Sunday night as her look hit social media. On Twitter, pictures of Schafer immediately received tens of thousands of likes, while her own Instagram post has now been liked more than 2 million times. Look of the Week: Zendaya steals the show at Louis Vuitton in head-to-toe tiger print But more than just creating a headline-grabbing moment, Schafer's ensemble was clearly considered. Fresh off the Fall-Winter 2023 runway, the look debuted earlier this month at fashion house Ann Demeulemeester's show in Paris. It was designed by Ludovic de Saint Sernin, the label's creative director since December. Celebrity fashion works best when there's a story behind a look. For example, the plausible Edie Sedgwick reference in Kendall Jenner's Bottega Veneta tights, or Paul Mescal winking at traditional masculinity in a plain white tank top. For his first Ann Demeulemeester collection, De Saint Sernin was inspired by "fashion-making as an authentic act of self-involvement." It was a love letter — almost literally — to the Belgian label's founder, with imagery of "authorship and autobiography" baked into the clothes (Sernin called his feather bandeaus "quills" in the show notes). Hunter Schafer's barely-there Oscars after party look was more poetic than it first seemed. These ideas of self-expression, self-love and self-definition took on new meaning when worn by Schafer. As a trans woman whose ascent to fame was inextricably linked to her gender identity — her big break was playing trans teenager Jules in HBO's "Euphoria" — Schafer's body is subjected to constant scrutiny online. The comment sections on her Instagram posts often descend into open forums, where users feel entitled (and seemingly compelled) to ask intimate questions about the trans experience or challenge Schafer's womanhood. Fittingly, there is a long lineage of gender-defying sentiments stitched into Schafer's outfit. Founded in 1985 by Ann Demeulemeester and her husband Patrick Robyn, the brand boasts a long legacy of gender-non-conforming fashion. "I was interested in the tension between masculine and feminine, but also the tension between masculine and feminine within one person," Demeulemeester told Vogue ahead of a retrospective exhibition of her work in Florence, Italy, last year. "That is what makes every person really interesting to me because everybody is unique." In his latest co-ed collection, De Saint Sernin — who is renowned in the industry for his eponymous, gender-fluid label — brought his androgynous world view to Ann Demeulemeester with fitted, romantic menswear silhouettes and sensual fabrics for all (think skin-tight mesh tops, leather, and open shirts made from a translucent organza material). Celebrity stylist Law Roach on dressing Zendaya and 'faking it 'till you make it' A quill strapped across her chest, Schafer let us know she is still writing her narrative — and defining herself on her own terms. There's an entire story contained in those two garments. As De Saint Sernin said in the show notes: "Thirty-six looks, each one a heartfelt sentence." The powerful ensemble may become one of Law Roach's last celebrity styling credits. Roach announced over social media on Tuesday that he would be retiring from the industry after 14 years of creating conversation-driving looks for the likes of Zendaya, Bella Hadid, Anya Taylor-Joy, Ariana Grande and Megan Thee Stallion.""" categories = [ "business", "entertainment", "politics", "sport", "technology", "world", "healthcare", "infrastructure", "education", "economy", "legal", "defence", "parliament", ] class MultiLengthTextClassificationPipeline(TextClassificationPipeline): _split_chunk_length = 510 def preprocess( self, inputs: str, **tokenizer_kwargs: t.Any ) -> dict[str, GenericTensor]: assert isinstance( inputs, str ), f"inputs currently only supports string as inputs (got {type(inputs)})" tokens = self.tokenizer.encode_plus( inputs, add_special_tokens=False, return_tensors="pt" ) # NOTE: egh we are copying this to list here, but we need to mutate these chunks, so tuple won't do it. input_id_chunks = list(tokens["input_ids"][0].split(self._split_chunk_length)) mask_chunks = list(tokens["attention_mask"][0].split(self._split_chunk_length)) # NOTE: we need to pad the last chunk to match the max length for i, (id_chunk, mask_chunk) in enumerate(zip(input_id_chunks, mask_chunks)): # get required padding length # bert length is usually 512 pad_len = 512 - id_chunk.shape[0] if pad_len > 0: # if padding length is more than 0, then pad input_id_chunks[i] = torch.cat([id_chunk, torch.Tensor([0] * pad_len)]) mask_chunks[i] = torch.cat([mask_chunk, torch.Tensor([0] * pad_len)]) input_ids = torch.stack(input_id_chunks) attention_mask = torch.stack(mask_chunks) return {"input_ids": input_ids.long(), "attention_mask": attention_mask.int()} PIPELINE_REGISTRY.register_pipeline( "multi-length-text-classification", pipeline_class=MultiLengthTextClassificationPipeline, pt_model=transformers.AutoModelForSequenceClassification if is_torch_available() else None, tf_model=transformers.TFAutoModelForSequenceClassification if is_tf_available() else None, default={ "pt": ("ProsusAI/finbert", "54bddcea"), "tf": ("ProsusAI/finbert", "54bddcea"), }, type="text", ) if __name__ == "__main__": from transformers import pipeline import bentoml # NOTE: Summarization models suggestions: # - sshleifer/distilbart-cnn-12-6 (default) # - google/pegasus-cnn_dailymail if you have a beefy GPU summarization_model = "sshleifer/distilbart-cnn-12-6" summarizer = pipeline("summarization", model=summarization_model) print("Summarized:", summarizer(text, max_length=MAX_LENGTH)[0]["summary_text"]) print( f"Saved summarizer model: {bentoml.transformers.save_model('summarizer-pipeline', summarizer, metadata=dict(model_name=summarization_model))}", ) print("\n", "=" * 50, "\n") # NOTE: Zero-shot classification models suggestions: # - facebook/bart-large-mnli (default) classification_model = "facebook/bart-large-mnli" classifier = pipeline("zero-shot-classification", model=classification_model) predicted = classifier(text, categories, multi_label=True) print( "Categories prediction:", {c: p for c, p in zip(predicted["labels"], predicted["scores"])}, ) print( f"Saved categorizer model: {bentoml.transformers.save_model('categorizer-pipeline', classifier, metadata=dict(model_name=classification_model))}", ) print("\n", "=" * 50, "\n") # NOTE: Sentiment analysis models suggestions: # - distilbert-base-uncased-finetuned-sst-2-english (default) # - bhadresh-savani/distilbert-base-uncased-emotion # - ProsusAI/finbert sentiment_model = "ProsusAI/finbert" sentimenter = pipeline( "multi-length-text-classification", model=sentiment_model, top_k=None ) print("Sentiment prediction:", sentimenter(text, max_length=MAX_LENGTH)) print( f"Saved sentimenter model: {bentoml.transformers.save_model('sentimenter-pipeline', sentimenter, metadata=dict(model_name=sentiment_model))}", )