// Part of the Crubit project, under the Apache License v2.0 with LLVM
// Exceptions. See /LICENSE for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
use anyhow::{anyhow, Result};
use ffi_types::*;
use ir::*;
use itertools::Itertools;
use proc_macro2::TokenStream;
use quote::format_ident;
use quote::quote;
use std::iter::Iterator;
use std::panic::catch_unwind;
use std::process;
use syn::*;
/// FFI equivalent of `Bindings`.
///
/// Each field carries the bytes of the corresponding `Bindings` string, wrapped in a
/// `FfiU8SliceBox` (see `GenerateBindingsImpl`, which builds this struct).
pub struct FfiBindings {
// Bytes of the generated Rust source code (from `Bindings::rs_api`).
rs_api: FfiU8SliceBox,
// Bytes of the generated C++ source code (from `Bindings::rs_api_impl`).
rs_api_impl: FfiU8SliceBox,
/// Deserializes IR from `json` and generates bindings source code.
///
/// On failure this function does not return: an error from `generate_bindings` is turned into a
/// panic by `unwrap()`, the panic is caught by `catch_unwind`, and the process is then aborted
/// via `process::abort()`.
///
/// # Ownership
///
/// * function doesn't take ownership of (in other words it borrows) the param `json`
/// * function passes ownership of the returned value to the caller
///
/// # Safety
///
/// * function expects that param `json` is a FfiU8Slice for a valid array of bytes with the
///   given size.
/// * function expects that param `json` doesn't change during the call.
pub unsafe extern "C" fn GenerateBindingsImpl(json: FfiU8Slice) -> FfiBindings {
catch_unwind(|| {
// It is ok to abort here: a panic raised by this `unwrap()` is caught by the enclosing
// `catch_unwind` and converted into `process::abort()`.
let Bindings { rs_api, rs_api_impl } = generate_bindings(json.as_slice()).unwrap();
FfiBindings {
// The generated source strings are handed over as boxed byte slices.
rs_api: FfiU8SliceBox::from_boxed_slice(rs_api.into_bytes().into_boxed_slice()),
rs_api_impl: FfiU8SliceBox::from_boxed_slice(
.unwrap_or_else(|_| process::abort())
/// Source code for generated bindings.
///
/// Produced by `generate_bindings`; `GenerateBindingsImpl` converts it into `FfiBindings`.
struct Bindings {
// Rust source code (output of `generate_rs_api`).
rs_api: String,
// C++ source code (output of `generate_rs_api_impl`).
rs_api_impl: String,
/// Deserializes the IR from `json` and generates both halves of the bindings.
///
/// Returns a `Bindings` holding the Rust API source and the C++ implementation source.
///
/// # Errors
///
/// Propagates the first error returned by `deserialize_ir`, `generate_rs_api` or
/// `generate_rs_api_impl`.
fn generate_bindings(json: &[u8]) -> Result<Bindings> {
let ir = deserialize_ir(json)?;
let rs_api = generate_rs_api(&ir)?;
let rs_api_impl = generate_rs_api_impl(&ir)?;
Ok(Bindings { rs_api, rs_api_impl })
/// Tells whether the C++ thunk for `func` can be skipped.
///
/// If we know the original C++ function is codegenned and already compatible with `extern "C"`
/// calling convention we skip creating/calling the C++ thunk since we can call the original C++
/// function directly.
fn can_skip_cc_thunk(func: &Func) -> bool {
// Inline functions may not be codegenned in the C++ library since Clang doesn't know if Rust
// calls the function or not. Therefore in order to make inline functions callable from Rust we
// need to generate a C++ file that defines a thunk that delegates to the original inline
// function. When compiled, Clang will emit code for this thunk and Rust code will call the
// thunk when the user wants to call the original inline function.
//
// This is not great runtime-performance-wise in regular builds (inline function will not be
// inlined, there will always be a function call), but it is correct. ThinLTO builds will be
// able to see through the thunk and inline code across the language boundary. For non-ThinLTO
// builds we plan to implement <internal link> which removes the runtime performance overhead.
/// Generate Rust source code for a given Record.
///
/// Emits a `pub struct` named after the record with one field per entry in `record.fields`.
///
/// # Errors
///
/// Returns an error if `format_rs_type` fails for any field type.
fn generate_record(record: &Record) -> Result<TokenStream> {
let ident = make_ident(&record.identifier.identifier);
// Field names and field types are collected separately so they can be interpolated in
// lockstep inside the `quote!` repetition below.
let field_idents =
record.fields.iter().map(|f| make_ident(&f.identifier.identifier)).collect_vec();
let field_types =
record.fields.iter().map(|f| format_rs_type(&f.type_)).collect::<Result<Vec<_>>>()?;
// Only fields that are public in C++ get the `pub` qualifier; every other access specifier
// produces no visibility qualifier.
let field_accesses = record
.map(|f| {
if f.access == AccessSpecifier::Public {
quote! { pub }
} else {
quote! {}
Ok(quote! {
pub struct #ident {
#( #field_accesses #field_idents: #field_types, )*
/// Generates the Rust side of the bindings for `ir`.
///
/// For every function in `ir.functions` this emits a public wrapper that calls an `extern "C"`
/// declaration named `__rust_thunk__<identifier>` inside `mod detail`. For every record in
/// `ir.records` it emits a struct via `generate_record`.
///
/// # Errors
///
/// Returns an error if `format_rs_type` fails for a return or parameter type, or if
/// `generate_record` fails.
fn generate_rs_api(ir: &IR) -> Result<String> {
// `thunks` collects the `extern "C"` declarations, `api_funcs` the public wrappers.
let mut thunks = vec![];
let mut api_funcs = vec![];
for func in &ir.functions {
let mangled_name = &func.mangled_name;
let ident = make_ident(&func.identifier.identifier);
let thunk_ident = format_ident!("__rust_thunk__{}", &func.identifier.identifier);
// TODO(hlopko): do not emit `-> ()` when return type is void, it's implicit.
let return_type_name = format_rs_type(&func.return_type)?;
let param_idents =
func.params.iter().map(|p| make_ident(&p.identifier.identifier)).collect_vec();
let param_types =
func.params.iter().map(|p| format_rs_type(&p.type_)).collect::<Result<Vec<_>>>()?;
api_funcs.push(quote! {
pub fn #ident( #( #param_idents: #param_types ),* ) -> #return_type_name {
unsafe { crate::detail::#thunk_ident( #( #param_idents ),* ) }
// When no C++ thunk is generated, the declaration is linked against the original function
// through its mangled name; otherwise it resolves to the thunk's own name.
let thunk_attr = if can_skip_cc_thunk(&func) {
quote! {#[link_name = #mangled_name]}
} else {
quote! {}
thunks.push(quote! {
pub(crate) fn #thunk_ident( #( #param_idents: #param_types ),* ) -> #return_type_name ;
let records = ir.records.iter().map(generate_record).collect::<Result<Vec<_>>>()?;
// `mod detail` is left out entirely when there are no functions to declare.
let mod_detail = if thunks.is_empty() {
quote! {}
} else {
quote! {
mod detail {
extern "C" {
#( #thunks )*
let result = quote! {
#( #api_funcs )*
#( #records )*
/// Builds an `Ident` whose text is `ident`, using `format_ident!`.
fn make_ident(ident: &str) -> Ident {
format_ident!("{}", ident)
/// Formats `ty` as Rust type tokens, based on `ty.rs_name` and `ty.type_params`.
///
/// * `*mut` / `*const` are pointer types: the single type parameter is formatted recursively
///   and prefixed with the pointer fragment.
/// * Any other name is emitted as a plain identifier.
///
/// # Errors
///
/// Returns an error for a pointer type that does not have exactly one type parameter, and for
/// a non-pointer type that has any type parameters (not yet supported).
fn format_rs_type(ty: &ir::IRType) -> Result<TokenStream> {
// `Some(..)` only for the two pointer spellings; everything else is a plain named type.
let ptr_fragment = match ty.rs_name.as_str() {
"*mut" => Some(quote! {*mut}),
"*const" => Some(quote! {*const}),
_ => None,
match ptr_fragment {
Some(ptr_fragment) => {
if ty.type_params.len() != 1 {
return Err(anyhow!(
"Invalid pointer type (need exactly 1 type parameter): {:?}",
// The pointee is formatted recursively, so nested pointers are supported.
let nested_type = format_rs_type(&ty.type_params[0])?;
Ok(quote! {#ptr_fragment #nested_type})
None => {
if ty.type_params.len() > 0 {
return Err(anyhow!("Type not yet supported: {:?}", ty));
let ident = make_ident(&ty.rs_name);
Ok(quote! {#ident})
/// Formats `ty` as C++ type tokens, based on `ty.cc_name`, `ty.cc_const` and `ty.type_params`.
///
/// * `*` is a pointer type: the single type parameter is formatted recursively and followed by
///   `*` and, when `ty.cc_const` is set, `const`.
/// * Any other name is emitted as an identifier, followed by `const` when `ty.cc_const` is set.
///
/// # Errors
///
/// Returns an error for a pointer type that does not have exactly one type parameter, and for
/// a non-pointer type that has any type parameters (not yet supported).
fn format_cc_type(ty: &ir::IRType) -> Result<TokenStream> {
// The qualifier is placed after the type it applies to in both branches below.
let const_fragment = if ty.cc_const {
quote! {const}
} else {
quote! {}
match ty.cc_name.as_str() {
"*" => {
if ty.type_params.len() != 1 {
return Err(anyhow!(
"Invalid pointer type (need exactly 1 type parameter): {:?}",
// NOTE(review): this assertion looks redundant with the length check above, which already
// returns an error when the count is not 1 -- confirm and consider removing.
assert_eq!(ty.type_params.len(), 1);
let nested_type = format_cc_type(&ty.type_params[0])?;
Ok(quote! {#nested_type * #const_fragment})
ident => {
if ty.type_params.len() > 0 {
return Err(anyhow!("Type not yet supported: {:?}", ty));
let ident = make_ident(ident);
Ok(quote! {#ident #const_fragment})
/// Generates the C++ side of the bindings for `ir`.
///
/// Emits an `extern "C"` thunk named `__rust_thunk__<identifier>` that forwards its arguments
/// to the original function, preceded by `include` directives built from `ir.used_headers`.
///
/// # Errors
///
/// Returns an error if `format_cc_type` fails for a return or parameter type.
fn generate_rs_api_impl(ir: &IR) -> Result<String> {
// This function uses quote! to generate C++ source code out of convenience. This is a bold idea
// so we have to continuously evaluate if it still makes sense or the cost of working around
// differences in Rust and C++ tokens is greater than the value added.
//
// See rs_bindings_from_cc/ for a list
// of supported placeholders.
let mut thunks = vec![];
for func in &ir.functions {
// Functions that Rust can call directly do not need a C++ thunk.
if can_skip_cc_thunk(&func) {
let thunk_ident = format_ident!("__rust_thunk__{}", &func.identifier.identifier);
let ident = make_ident(&func.identifier.identifier);
let return_type_name = format_cc_type(&func.return_type)?;
let param_idents =
func.params.iter().map(|p| make_ident(&p.identifier.identifier)).collect_vec();
let param_types =
func.params.iter().map(|p| format_cc_type(&p.type_)).collect::<Result<Vec<_>>>()?;
// The thunk simply forwards all parameters to the original function.
thunks.push(quote! {
extern "C" #return_type_name #thunk_ident( #( #param_types #param_idents ),* ) {
return #ident( #( #param_idents ),* );
// In order to generate C++ thunk in all the cases Clang needs to be able to access declarations
// from public headers of the C++ library.
let includes = ir.used_headers.iter().map(|i| &;
// `__HASH_TOKEN__` and `__NEWLINE__` are placeholder tokens standing in for `#` and a line
// break in the generated C++ text.
let result = quote! {
#( __HASH_TOKEN__ include #includes __NEWLINE__)*
#( #thunks )*
mod tests {
use super::Result;
use super::{generate_rs_api, generate_rs_api_impl};
use ir::*;
use quote::quote;
use token_stream_printer::cc_tokens_to_string;
// A non-inline function `add(int, int) -> int`: the expected Rust API declares the thunk with
// `#[link_name = "_Z3Addii"]`, and the generated C++ implementation is expected to be empty.
fn test_simple_function() -> Result<()> {
let ir = IR {
used_headers: vec![],
records: vec![],
functions: vec![Func {
identifier: Identifier { identifier: "add".to_string() },
mangled_name: "_Z3Addii".to_string(),
return_type: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
params: vec![
FuncParam {
identifier: Identifier { identifier: "a".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
FuncParam {
identifier: Identifier { identifier: "b".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
is_inline: false,
// Expected Rust API.
quote! {
pub fn add(a: i32, b: i32) -> i32 {
unsafe { crate::detail::__rust_thunk__add(a, b) }
mod detail {
extern "C" {
#[link_name = "_Z3Addii"]
pub(crate) fn __rust_thunk__add(a: i32, b: i32) -> i32;
} // extern
} // mod detail
// No thunk is needed for a non-inline function, so no C++ code is expected.
assert_eq!(generate_rs_api_impl(&ir)?, "");
// An inline function `add(int, int) -> int` with two used headers: the expected Rust API
// declares the thunk without `link_name`, and the expected C++ implementation includes both
// headers and defines the forwarding thunk.
fn test_inline_function() -> Result<()> {
let ir = IR {
records: vec![],
used_headers: vec![
HeaderName { name: "foo/bar.h".to_string() },
HeaderName { name: "foo/baz.h".to_string() },
functions: vec![Func {
identifier: Identifier { identifier: "add".to_string() },
mangled_name: "_Z3Addii".to_string(),
return_type: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
params: vec![
FuncParam {
identifier: Identifier { identifier: "a".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
FuncParam {
identifier: Identifier { identifier: "b".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
is_inline: true,
// Expected Rust API.
quote! {#[inline(always)]
pub fn add(a: i32, b: i32) -> i32 {
unsafe { crate::detail::__rust_thunk__add(a, b) }
mod detail {
extern "C" {
pub(crate) fn __rust_thunk__add(a: i32, b: i32) -> i32;
} // extern
} // mod detail
// Expected C++ implementation: includes followed by the thunk definition.
cc_tokens_to_string(quote! {
__HASH_TOKEN__ include "foo/bar.h" __NEWLINE__
__HASH_TOKEN__ include "foo/baz.h" __NEWLINE__
extern "C" int __rust_thunk__add(int a, int b) {
return add(a, b);
// A record with one public, one protected and one private `int` field: only the public field
// is expected to be `pub` in the generated struct, and no C++ code is expected.
fn test_simple_struct() -> Result<()> {
let ir = IR {
used_headers: vec![],
records: vec![Record {
identifier: Identifier { identifier: "SomeStruct".to_string() },
fields: vec![
Field {
identifier: Identifier { identifier: "public_int".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
access: AccessSpecifier::Public,
Field {
identifier: Identifier { identifier: "protected_int".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
access: AccessSpecifier::Protected,
Field {
identifier: Identifier { identifier: "private_int".to_string() },
type_: IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
access: AccessSpecifier::Private,
functions: vec![],
// Expected Rust API.
quote! {
pub struct SomeStruct {
pub public_int: i32,
protected_int: i32,
private_int: i32,
// Records alone do not produce any C++ code.
assert_eq!(generate_rs_api_impl(&ir)?, "");
// An inline function `Deref` taking a pointer to a const pointer to `int` and returning a
// pointer to `int`: exercises nested pointer formatting on both the Rust and the C++ side.
fn test_ptr_func() -> Result<()> {
let ir = IR {
used_headers: vec![],
records: vec![],
functions: vec![Func {
identifier: Identifier { identifier: "Deref".to_string() },
mangled_name: "_Z5DerefPKPi".to_string(),
return_type: IRType {
rs_name: "*mut".to_string(),
cc_name: "*".to_string(),
cc_const: false,
type_params: vec![IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
params: vec![FuncParam {
identifier: Identifier { identifier: "p".to_string() },
type_: IRType {
rs_name: "*const".to_string(),
cc_name: "*".to_string(),
cc_const: false,
type_params: vec![IRType {
rs_name: "*mut".to_string(),
cc_name: "*".to_string(),
cc_const: true,
type_params: vec![IRType {
rs_name: "i32".to_string(),
cc_name: "int".to_string(),
cc_const: false,
type_params: vec![],
is_inline: true,
// Expected Rust API.
quote! {
pub fn Deref(p: *const *mut i32) -> *mut i32 {
unsafe { crate::detail::__rust_thunk__Deref(p) }
mod detail {
extern "C" {
pub(crate) fn __rust_thunk__Deref(p: *const *mut i32) -> *mut i32;
} // extern
} // mod detail
// Expected C++ implementation: the inner pointer carries the `const` qualifier.
cc_tokens_to_string(quote! {
extern "C" int* __rust_thunk__Deref(int* const * p) {
return Deref(p);