head	1.9;
access;
symbols
	pkgsrc-2026Q1:1.9.0.4
	pkgsrc-2026Q1-base:1.9
	pkgsrc-2025Q4:1.9.0.2
	pkgsrc-2025Q4-base:1.9
	pkgsrc-2025Q3:1.8.0.2
	pkgsrc-2025Q3-base:1.8
	pkgsrc-2025Q2:1.7.0.2
	pkgsrc-2025Q2-base:1.7
	pkgsrc-2025Q1:1.6.0.14
	pkgsrc-2025Q1-base:1.6
	pkgsrc-2024Q4:1.6.0.12
	pkgsrc-2024Q4-base:1.6
	pkgsrc-2024Q3:1.6.0.10
	pkgsrc-2024Q3-base:1.6
	pkgsrc-2024Q2:1.6.0.8
	pkgsrc-2024Q2-base:1.6
	pkgsrc-2024Q1:1.6.0.6
	pkgsrc-2024Q1-base:1.6
	pkgsrc-2023Q4:1.6.0.4
	pkgsrc-2023Q4-base:1.6
	pkgsrc-2023Q3:1.6.0.2
	pkgsrc-2023Q3-base:1.6
	pkgsrc-2023Q2:1.1.0.4
	pkgsrc-2023Q2-base:1.1
	pkgsrc-2023Q1:1.1.0.2
	pkgsrc-2023Q1-base:1.1;
locks; strict;
comment	@# @;


1.9
date	2025.10.26.12.15.39;	author ryoon;	state Exp;
branches;
next	1.8;
commitid	ksU5Z0Ayw0T4L4gG;

1.8
date	2025.08.22.17.28.59;	author wiz;	state Exp;
branches;
next	1.7;
commitid	WnwsRq58UcC1AK7G;

1.7
date	2025.06.06.07.51.53;	author wiz;	state Exp;
branches;
next	1.6;
commitid	uuU2IdUq244yRNXF;

1.6
date	2023.07.18.18.47.53;	author nia;	state Exp;
branches;
next	1.5;
commitid	gFDlNZ0VuIeFDjxE;

1.5
date	2023.07.13.13.55.10;	author nia;	state Exp;
branches;
next	1.4;
commitid	0pJOaqpxfFI2bEwE;

1.4
date	2023.07.13.13.49.17;	author nia;	state Exp;
branches;
next	1.3;
commitid	YLzs5mHc2c0d9EwE;

1.3
date	2023.07.12.14.52.15;	author he;	state Exp;
branches;
next	1.2;
commitid	VbcIMf9f6YnOwwwE;

1.2
date	2023.07.11.06.09.29;	author nia;	state Exp;
branches;
next	1.1;
commitid	VjJhJB44xczwFlwE;

1.1
date	2023.03.13.14.17.12;	author wiz;	state Exp;
branches;
next	;
commitid	oh4WOpDIfy61eYgE;


desc
@@


1.9
log
@textproc/{py-,}sentencepiece: Update to 0.2.1

Changelog:
0.2.1:
Major changes

  * [Python] Supported wheels and builds for Python 3.13 and 3.14(rc1) #1134,
    #1127, #1121, #1111, #1110, #1104, #1103, #1099, #1091
  * [Python] Added an experimental support for free-threading. #1134, #1127,
    #1110 https://github.com/google/sentencepiece/tree/master/python#free-threading-support
  * [Python] Updated the supported Python version to 3.9 or later.

New features

  * [ALL]: Added new build mode to prevent the precompiled normalization
    rules being embedded in *.so and *.a. (-DSPM_DISABLE_EMBEDDED_DATA=ON).
  * This reduces the runtime size by approximately 1-2 MB. This mode is
    enabled to build python wheels. The rules are loaded as the data package.

Bug fixes & minor changes

  * [ALL]: Security fix to address a heap overflow issue that could occur
    when using a model containing an invalid precompiled normalization model.
  * [Python]: Deprecates the wheel package for Linux i686.
  * [Python]: Supported wheel for Windows Arm64. #1114
  * [Python]: Fixed the crash issue on batch decoding #1051
  * [ALL]: Updated the Unicode normalization rule with the latest ICU/Unicode
    rules.
  * [ALL]: Unused code and build mode cleanup.
@
text
@# $NetBSD: Makefile.common,v 1.8 2025/08/22 17:28:59 wiz Exp $
#
# used by textproc/sentencepiece/Makefile
# used by textproc/py-sentencepiece/Makefile

DISTNAME=	sentencepiece-0.2.1
CATEGORIES=	textproc
MASTER_SITES=	${MASTER_SITE_GITHUB:=google/}
GITHUB_PROJECT=	sentencepiece
GITHUB_TAG=	v${PKGVERSION_NOREV}

MAINTAINER=	pkgsrc-users@@NetBSD.org
HOMEPAGE=	https://github.com/google/sentencepiece/
COMMENT=	Unsupervised text tokenizer for Neural Network-based text generation
LICENSE=	apache-2.0

USE_LANGUAGES=		c c++
USE_CXX_FEATURES=	c++17

.include "../../mk/atomic64.mk"
@


1.8
log
@*sentencepiece*: fix patch usage

can't share patches because of different WRKSRC
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.7 2025/06/06 07:51:53 wiz Exp $
d6 1
a6 1
DISTNAME=	sentencepiece-0.2.0
d9 1
@


1.7
log
@{py-,}sentencepiece: update to 0.2.0
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.6 2023/07/18 18:47:53 nia Exp $
a17 2
DISTINFO_FILE=		${.CURDIR}/../../textproc/sentencepiece/distinfo
PATCHDIR=		${.CURDIR}/../../textproc/sentencepiece/patches
@


1.6
log
@textproc: Adapt packages (where possible) to USE_(CC|CXX)_FEATURES
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.5 2023/07/13 13:55:10 nia Exp $
d6 1
a6 1
DISTNAME=	sentencepiece-0.1.97
d18 2
@


1.5
log
@*: Revert two recent commits that dropped a cwrappers-enforced C++ standard
by packages that already use -std=c++XX until the discussion about C++
standard versions is resolved.

Requested by pkgsrc-pmc@@.
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.4 2023/07/13 13:49:17 nia Exp $
d16 2
a17 1
USE_LANGUAGES=	c c++17
@


1.4
log
@*: Remove all instances of GCC_REQD where my name is the most recent
in 'cvs annotate' (part 2)
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.3 2023/07/12 14:52:15 he Exp $
d16 1
a16 1
USE_LANGUAGES=	c c++
@


1.3
log
@sentencepiece: Use mk/atomic64.mk as that's required.
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.2 2023/07/11 06:09:29 nia Exp $
a17 3
# C++17
GCC_REQD+=	7

@


1.2
log
@sentencepiece: Require a C++17 compiler the proper way.
@
text
@d1 1
a1 1
# $NetBSD: Makefile.common,v 1.1 2023/03/13 14:17:12 wiz Exp $
d20 2
@


1.1
log
@textproc/sentencepiece: import sentencepiece-0.1.97

SentencePiece is an unsupervised text tokenizer and detokenizer
mainly for Neural Network-based text generation systems where the
vocabulary size is predetermined prior to the neural model training.
SentencePiece implements subword units (e.g., byte-pair-encoding
(BPE)) and unigram language model with the extension of direct
training from raw sentences. SentencePiece allows us to make a
purely end-to-end system that does not depend on language-specific
pre/postprocessing.
@
text
@d1 1
a1 1
# $NetBSD$
d16 4
a19 1
USE_LANGUAGES=	c c++17
@

